Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 10 for getCrawlerContext (0.07 sec)

  1. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler.setBackground(true);
                ((UrlFilterImpl) crawler.urlFilter).setIncludeFilteringPattern("$1$2$3.*");
                crawler.addUrl(url);
                crawler.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler.getCrawlerContext().setNumOfThread(numOfThread);
                final String sessionId = crawler.execute();
    
                // Wait for crawler to start running with polling
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            testCrawler.setNumOfThread(5);
            assertEquals(5, testCrawler.getCrawlerContext().getNumOfThread());
    
            testCrawler.setMaxThreadCheckCount(15);
            assertEquals(15, testCrawler.getCrawlerContext().getMaxThreadCheckCount());
    
            testCrawler.setMaxDepth(10);
            assertEquals(10, testCrawler.getCrawlerContext().getMaxDepth());
    
            testCrawler.setMaxAccessCount(100);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Tue Nov 11 13:40:14 UTC 2025
    - 25.8K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlingParameterUtilTest.java

            assertNull(CrawlingParameterUtil.getCrawlerContext());
    
            // Create and set a CrawlerContext
            CrawlerContext context = new CrawlerContext();
            context.setSessionId("test-context-session");
    
            CrawlingParameterUtil.setCrawlerContext(context);
    
            // Verify it can be retrieved
            CrawlerContext retrieved = CrawlingParameterUtil.getCrawlerContext();
            assertNotNull(retrieved);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 14.6K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                file.mkdirs();
                file.deleteOnExit();
                fileTransformer.setPath(file.getAbsolutePath());
                crawler.addUrl(url);
                crawler.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler.getCrawlerContext().setNumOfThread(numOfThread);
                crawler.urlFilter.addInclude(url + ".*");
                final String sessionId = crawler.execute();
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

                        if (crawlerList.get(i).getCrawlerContext().getStatus() == CrawlerStatus.DONE
                                && Constants.RUNNING.equals(crawlerStatusList.get(i))) {
                            crawlerList.get(i).awaitTermination();
                            crawlerStatusList.set(i, Constants.DONE);
                            final String sid = crawlerList.get(i).getCrawlerContext().getSessionId();
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 25K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

     * <p>Usage example:</p>
     * <pre>
     * {@code
     * UrlQueue<?> urlQueue = CrawlingParameterUtil.getUrlQueue();
     * CrawlingParameterUtil.setUrlQueue(newUrlQueue);
     *
     * CrawlerContext context = CrawlingParameterUtil.getCrawlerContext();
     * CrawlingParameterUtil.setCrawlerContext(newContext);
     *
     * UrlQueueService<UrlQueue<?>> urlQueueService = CrawlingParameterUtil.getUrlQueueService();
     * CrawlingParameterUtil.setUrlQueueService(newUrlQueueService);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 22 13:28:22 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  7. CLAUDE.md

    ```java
    // Set (in CrawlerThread)
    CrawlingParameterUtil.setCrawlerContext(context);
    CrawlingParameterUtil.setUrlQueue(urlQueue);
    
    // Get (anywhere in same thread)
    CrawlerContext ctx = CrawlingParameterUtil.getCrawlerContext();
    
    // Clear (ALWAYS in finally)
    CrawlingParameterUtil.clearAll();
    ```
    
    ## Log Message Guidelines
    
    - Format parameters as `key=value` (e.g., `sessionId={}`, `url={}`)
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

         */
        protected void processResult(final UrlQueue<?> urlQueue, final ResponseData responseData, final ResultData resultData) {
            final CrawlerContext crawlerContext = CrawlingParameterUtil.getCrawlerContext();
            final UrlQueueService<UrlQueue<?>> urlQueueService = CrawlingParameterUtil.getUrlQueueService();
            if (!urlQueueService.visited(urlQueue)) {
                if (checkAccessCount(crawlerContext)) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

            }
        }
    
        /**
         * Returns the crawler context.
         * @return The CrawlerContext instance.
         */
        public CrawlerContext getCrawlerContext() {
            return crawlerContext;
        }
    
        /**
         * Sets the number of threads.
         * @param numOfThread The number of threads.
         */
        public void setNumOfThread(final int numOfThread) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 17K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                // not support robots.txt
                return;
            }
    
            // crawler context
            final CrawlerContext crawlerContext = CrawlingParameterUtil.getCrawlerContext();
            if (crawlerContext == null) {
                // wrong state
                return;
            }
    
            final int idx = url.indexOf('/', url.indexOf("://") + 3);
            String hostUrl;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 53.7K bytes
    - Viewed (0)
Back to top