Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 50 of 65 for urlset (0.02 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

        // public ResponseData call() throws Exception {
        // String[] urls =
        // new String[] {
        // "http://.../",
        // "http://.../test.pdf",
        // "http://.../test.doc",
        // "http://.../test.xls",
        // "http://.../test.ppt",
        // "http://.../test.txt", };
        // for (String url : urls) {
        // ResponseData responseData = httpClient.doGet(url);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

         * Test match with no patterns configured
         */
        public void test_match_noPatterns() {
            String sessionId = "test-session-009";
            urlFilter.init(sessionId);
    
            // Without any patterns, all URLs should match
            assertTrue(urlFilter.match("https://example.com/"));
            assertTrue(urlFilter.match("https://test.com/page"));
            assertTrue(urlFilter.match("ftp://files.com/document.pdf"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbAuthentication.java

     *
     * <p>
     * It provides methods to set and retrieve the server address, port, username,
     * password, and domain. Additionally, it offers a method to construct a path
     * prefix for SMB1 URLs based on the configured server and port.
     * </p>
     *
     * <p>
     * The path prefix is in the format "smb1://server:port/", where the port is
     * included only if it's greater than 0. If the server is not set, the path
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 3.9K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResponseData.java

         */
        public void removeChildUrl(final RequestData url) {
            childUrlSet.remove(url);
        }
    
        /**
         * Gets the set of child URLs discovered from this response.
         *
         * @return the set of child URLs
         */
        public Set<RequestData> getChildUrlSet() {
            return childUrlSet;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 11.6K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

     * <p>
     * The class contains methods for logging different types of events, such as:
     * </p>
     * <ul>
     *   <li>Starting and finishing threads</li>
     *   <li>Starting and cleaning up crawling</li>
     *   <li>Handling unsupported URLs</li>
     *   <li>Checking last modified dates</li>
     *   <li>Getting content</li>
     *   <li>Handling redirects</li>
     *   <li>Processing responses</li>
     *   <li>Handling exceptions during crawling and child URL processing</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb/SmbAuthentication.java

     *
     * <p>
     * It provides methods to set and retrieve the server address, port, username,
     * password, and domain. Additionally, it offers a method to construct a path
     * prefix for SMB URLs based on the configured server and port.
     * </p>
     *
     * <p>
     * The path prefix is in the format "smb://server:port/", where the port is
     * included only if it's greater than 0. If the server is not set, the path
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.9K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlQueueService.java

    import java.util.List;
    
    import org.codelibs.fess.crawler.entity.UrlQueue;
    
    /**
     * Service interface for managing URL queues.
     * Provides methods for adding, retrieving, and managing URLs within a crawling session.
     *
     * @param <QUEUE> the type of URL queue
     */
    public interface UrlQueueService<QUEUE extends UrlQueue<?>> {
    
        /**
         * Updates the session ID.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  8. src/test/java/org/codelibs/opensearch/extension/analysis/NGramSynonymTokenizer.java

        }
    
        @Override
        public void end() throws IOException {
            super.end();
            offsetAttr.setOffset(finalOffset, finalOffset);
        }
    
        @Override
        public void reset() throws IOException {
            super.reset();
            block.setLength(0);
            prevToken = null;
            readBufferIndex = BUFFER_SIZE;
            readBufferLen = 0;
            ch = 0;
            blkStart = 0;
            nextBlkStart = 0;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 17K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

                if (logger.isInfoEnabled()) {
                    logger.info("Use a default encoding: " + encoding, e);
                }
            } finally {
                try {
                    bis.reset();
                } catch (final IOException e) {
                    throw new ExtractException(e);
                }
            }
    
            return encoding;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/CrawlingAccessException.java

     * It extends CrawlerSystemException and provides functionality to set and check the log level for the exception.
     *
     * <p>
     * This exception can be thrown when there are problems accessing URLs, files, or any other resources needed for crawling.
     * It includes constructors to handle messages, causes, or both.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.8K bytes
    - Viewed (0)
Back to top