Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 45 for 1000 (0.01 sec)

  1. README.md

    ```java
    // Set maximum number of URLs to crawl
    crawler.crawlerContext.setMaxAccessCount(1000);
    
    // Set number of crawler threads
    crawler.crawlerContext.setNumOfThread(10);
    
    // Set maximum crawl depth
    crawler.crawlerContext.setMaxDepth(3);
    
    // Set request interval (politeness)
    crawler.crawlerContext.setDefaultIntervalTime(1000); // 1 second
    ```
    
    ### URL Filtering
    
    ```java
    // Include patterns
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            // Add URLs up to capacity (10000)
            for (int i = 0; i < 10000; i++) {
                urlSet.add("http://example" + i + ".com/robots.txt");
            }
            assertEquals(10000, urlSet.size());
    
            // Add one more should maintain size at 10000 (LRU eviction)
            urlSet.add("http://overflow.com/robots.txt");
            assertEquals(10000, urlSet.size());
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  3. src/test/java/org/codelibs/fess/suggest/SuggesterTest.java

            AtomicInteger numObInputDoc = new AtomicInteger(0);
            ESSourceReader reader = new ESSourceReader(client, suggester.settings(), indexName);
            reader.setScrollSize(1000);
    
            suggester.indexer().indexFromDocument(() -> reader, 1000, () -> ThreadUtil.sleep(100)).then(response -> {
                numObInputDoc.set(response.getNumberOfInputDocs());
                latch.countDown();
            }).error(t -> {
                t.printStackTrace();
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 37.2K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            // Create multiple threads adding patterns
            Thread thread1 = new Thread(() -> {
                for (int i = 0; i < 100; i++) {
                    urlFilter.addInclude("https://site" + i + ".com/.*");
                }
            });
    
            Thread thread2 = new Thread(() -> {
                for (int i = 0; i < 100; i++) {
                    urlFilter.addExclude(".*\\.type" + i + "$");
                }
            });
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/suggest/index/contents/document/ESSourceReader.java

            } else {
                this.limitPercentage = Integer.parseInt(limitPercentage);
            }
    
            if (this.limitPercentage > 100) {
                this.limitPercentage = 100;
            } else if (this.limitPercentage < 1) {
                this.limitPercentage = 1;
            }
        }
    
        /**
         * Sets the limit number.
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 11K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TextUtil.java

     * <pre>{@code
     * Reader reader = new StringReader("Example text to normalize.");
     * String normalizedText = TextUtil.normalizeText(reader)
     *                                  .initialCapacity(5000)
     *                                  .maxAlphanumTermSize(100)
     *                                  .maxSymbolTermSize(50)
     *                                  .duplicateTermRemoved(true)
     *                                  .spaceChars(new int[] { ' ', '\u00a0' })
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

         * @return the extracted body text
         * @throws ExtractException if extraction fails
         */
        protected String getBodyText(final MimeMessage message) {
            final StringBuilder buf = new StringBuilder(1000);
            try {
                final Object content = message.getContent();
                if (content instanceof final Multipart multipart) {
                    final int count = multipart.getCount();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/suggest/index/contents/DefaultContentsParser.java

        private final int maxAnalyzedContentLength;
    
        /**
         * Constructor.
         */
        public DefaultContentsParser() {
            maxAnalyzedContentLength = Integer.getInteger("fess.suggest.max.analyzed.content.length", 1000);
        }
    
        @Override
        public SuggestItem parseSearchWords(final String[] words, final String[][] readings, final String[] fields, final String[] tags,
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 15.4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

                throw new CrawlingAccessException("Could not parse " + responseData.getUrl(), e);
            }
            final Document document = parser.getDocument();
    
            final StringBuilder buf = new StringBuilder(1000);
            buf.append(getResultDataHeader());
            for (final Map.Entry<String, String> entry : fieldRuleMap.entrySet()) {
                final String path = entry.getValue();
                try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java

        protected long executionTimeout = 30L * 1000L; // 30sec
    
        /** The working directory for the command. */
        protected File workingDirectory = null;
    
        /** The encoding for the command's output. */
        protected String commandOutputEncoding = Charset.defaultCharset().displayName();
    
        /** The maximum number of lines to buffer from command output. */
        protected int maxOutputLine = 1000;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 16K bytes
    - Viewed (0)
Back to top