Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 70 for dela (0.02 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalControllerTest.java

        }
    
        /**
         * Test multiple delay calls
         */
        public void test_multipleDelayCalls() {
            final TestIntervalController controller = new TestIntervalController();
    
            controller.delay(IntervalController.PRE_PROCESSING);
            controller.delay(IntervalController.POST_PROCESSING);
            controller.delay(IntervalController.NO_URL_IN_QUEUE);
            controller.delay(IntervalController.WAIT_NEW_URL);
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:58:39 UTC 2025
    - 9.8K bytes
    - Viewed (0)
  2. src/main/resources/fess_indices/fess/fr/stopwords.txt

    avais
    avait
    avions
    aviez
    avaient
    eut
    eûmes
    eûtes
    eurent
    aie
    aies
    ait
    ayons
    ayez
    aient
    eusse
    eusses
    eût
    eussions
    eussiez
    eussent
    ceci
    cela
    celà
    cet
    cette
    ici
    ils
    les
    leurs
    quel
    quels
    quelle
    quelles
    sans
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Mon Nov 27 12:59:36 UTC 2023
    - 977 bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java

        int NO_URL_IN_QUEUE = 4;
    
        /** Constant indicating that the crawler is waiting for new URLs. */
        int WAIT_NEW_URL = 8;
    
        /**
         * Introduces a delay based on the specified type.
         *
         * @param type the type of delay to be introduced
         */
        void delay(int type);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  4. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt

    User-agent: FessCrawler
    Disallow:           # allows all 
    
    User-agent: BruteBot
    Disallow: /
    Allow: /foo/bar/
    Crawl-delay: 1314000
    
    # welcome!
    User-agent: Googlebot
    Crawl-delay: 1
    
    User-agent: *
    Disallow: /private/
    Disallow: /help        # disallows /help.html, /help/index.html, etc.
    Allow: /help/faq.html
    Crawl-delay: 3
    
    User-agent: Crawler
    Disallow: /aaa
    
    User-agent: Crawler/1.0
    Disallow: /bbb
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 566 bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/DefaultIntervalController.java

        /** Delay in milliseconds after processing a URL */
        protected long delayMillisAfterProcessing = 0L;
    
        /** Delay in milliseconds when no URL is in the queue */
        protected long delayMillisAtNoUrlInQueue = 500L;
    
        /** Delay in milliseconds before processing a URL */
        protected long delayMillisBeforeProcessing = 0L;
    
        /** Delay in milliseconds for waiting for new URLs */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:58:39 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java

     * The delayBeforeProcessing method is overridden to introduce a delay before processing a URL,
     * ensuring that requests to the same host are not made too frequently.
     * The delay is calculated based on the configured delayMillisBeforeProcessing parameter.
     * If the time since the last request to the host is less than the configured delay,
     * the thread waits until the delay has elapsed.
     * This class is thread-safe.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 5.2K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/crawler/interval/FessIntervalController.java

            super();
        }
    
        /**
         * Gets the delay time in milliseconds after processing a URL.
         *
         * @return the delay time in milliseconds after processing
         */
        public long getDelayMillisAfterProcessing() {
            return delayMillisAfterProcessing;
        }
    
        /**
         * Sets the delay time in milliseconds after processing a URL.
         *
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Wed Nov 19 07:09:17 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/interval/impl/DefaultIntervalControllerTest.java

            controller.delayAfterProcessing();
            final long elapsed = (System.nanoTime() - start) / 1000000;
    
            assertTrue("No delay expected", elapsed < 50); // Should be nearly instant
        }
    
        /**
         * Test delayAfterProcessing with actual delay
         */
        public void test_delayAfterProcessing_withDelay() {
            final DefaultIntervalController controller = new DefaultIntervalController();
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:58:39 UTC 2025
    - 8.1K bytes
    - Viewed (0)
  9. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_malformed.txt

    Disallow: /admin/
    InvalidDirective: some-value
    unknown-field: test
    Disallow /missing-colon
    Disallow:    # empty value (should be treated as allowing all)
    Allow: /public/
    Crawl-delay: invalid-number
    Crawl-delay: -10
    Crawl-delay: 5.5
    Crawl-delay:
    Allow:    # empty value
    
    # Case 3: Multiple colons in directive
    User-agent: MultiColonBot
    Disallow: http://example.com:8080/path
    Allow: /path:with:colons
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 14 12:52:01 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        }
    
        /**
         * Gets the crawl delay value for the specified user agent from robots.txt.
         * The crawl delay specifies the time (in seconds) to wait between successive requests.
         *
         * @param userAgent The user agent string to match against robots.txt directives
         * @return The crawl delay value in seconds. Returns 0 if no matching directive is found
         *         or no crawl delay is specified for the matching directive.
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 18.5K bytes
    - Viewed (0)
Back to top