Search Options

Results per page
Sort
Preferred Languages
Advance

Results 31 - 40 of 58 for Burles (0.11 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlQueueServiceImpl.java

     * This class provides methods for managing a queue of URLs to be crawled,
     * including adding, deleting, and retrieving URLs from the queue.
     * It uses a {@link MemoryDataHelper} to store the URL queue data in memory.
     *
     * <p>
     * The class is responsible for:
     * </p>
     * <ul>
     *   <li>Updating session IDs for URL queues.</li>
     *   <li>Adding new URLs to the queue.</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalController.java

     * <ul>
     *   <li>Before processing a URL ({@link #delayBeforeProcessing()})</li>
     *   <li>After processing a URL ({@link #delayAfterProcessing()})</li>
     *   <li>When there are no URLs in the queue ({@link #delayAtNoUrlInQueue()})</li>
     *   <li>While waiting for new URLs to be added to the queue ({@link #delayForWaitingNewUrl()})</li>
     * </ul>
     *
     * <p>
     * Subclasses are responsible for implementing the abstract methods to define the actual delay
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResultData.java

        protected String transformerName;
    
        /** The data of the result. */
        protected byte[] data;
    
        /** The encoding of the result. */
        protected String encoding;
    
        /** The set of the child URLs. */
        protected Set<RequestData> childUrlSet = new LinkedHashSet<>();
    
        /** The raw data. */
        protected Object rawData = null;
    
        /** The serializer. */
        protected Function<Object, byte[]> serializer;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

        // public ResponseData call() throws Exception {
        // String[] urls =
        // new String[] {
        // "http://.../",
        // "http://.../test.pdf",
        // "http://.../test.doc",
        // "http://.../test.xls",
        // "http://.../test.ppt",
        // "http://.../test.txt", };
        // for (String url : urls) {
        // ResponseData responseData = httpClient.doGet(url);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

    import org.xml.sax.InputSource;
    
    /**
     * {@link XpathTransformer} is a class that transforms HTML content into XML format based on XPath expressions.
     * It extracts data from an HTML document by applying XPath rules defined in {@link #fieldRuleMap}.
     * The extracted data is then formatted into an XML structure and stored in the {@link ResultData}.
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

         * Test match with no patterns configured
         */
        public void test_match_noPatterns() {
            String sessionId = "test-session-009";
            urlFilter.init(sessionId);
    
            // Without any patterns, all URLs should match
            assertTrue(urlFilter.match("https://example.com/"));
            assertTrue(urlFilter.match("https://test.com/page"));
            assertTrue(urlFilter.match("ftp://files.com/document.pdf"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

                logHelper.log(key, objs);
            }
        }
    
        /**
         * Runs the crawling process in a separate thread.
         * This method fetches URLs from the queue, accesses content, processes responses,
         * and extracts child URLs until the crawling process is done or no more URLs are available.
         */
        @Override
        public void run() {
            log(logHelper, LogType.START_THREAD, crawlerContext);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

     * <p>
     * The class contains methods for logging different types of events, such as:
     * </p>
     * <ul>
     *   <li>Starting and finishing threads</li>
     *   <li>Starting and cleaning up crawling</li>
     *   <li>Handling unsupported URLs</li>
     *   <li>Checking last modified dates</li>
     *   <li>Getting content</li>
     *   <li>Handling redirects</li>
     *   <li>Processing responses</li>
     *   <li>Handling exceptions during crawling and child URL processing</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbAuthentication.java

     *
     * <p>
     * It provides methods to set and retrieve the server address, port, username,
     * password, and domain. Additionally, it offers a method to construct a path
     * prefix for SMB1 URLs based on the configured server and port.
     * </p>
     *
     * <p>
     * The path prefix is in the format "smb1://server:port/", where the port is
     * included only if it's greater than 0. If the server is not set, the path
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 3.9K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

                    logger.debug("CrawlerClientCreator is unavailable.", e);
                }
            }
        }
    
        /**
         * Adds a client with a regular expression pattern.
         * @param regex The regular expression to match URLs.
         * @param client The CrawlerClient instance.
         */
        public void addClient(final String regex, final CrawlerClient client) {
            if (StringUtil.isBlank(regex)) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7K bytes
    - Viewed (0)
Back to top