Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 1 - 10 of 12 for CrawlerContext (0.12 seconds)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

     * </p>
     *
     * <p>
     * It also provides thread-local storage for sitemaps, allowing each thread to have its own set of sitemaps.
     * </p>
     */
    public class CrawlerContext {
        /**
         * Constructs a new CrawlerContext.
         */
        public CrawlerContext() {
            // Default constructor
        }
    
        /**
         * Session identifier for the crawling session.
         */
        protected String sessionId;
    
        /**
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Wed Dec 31 09:07:38 GMT 2025
    - 9K bytes
    - Click Count (0)
  2. src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java

            final UrlQueue<?> urlQueue = objs.length > 1 && objs[1] instanceof UrlQueue<?> ? (UrlQueue<?>) objs[1] : null;
            try {
                final CrawlerContext crawlerContext = (CrawlerContext) objs[0];
                final Throwable e = (Throwable) objs[2];
    
                storeFailureUrl(crawlerContext, urlQueue, e.getClass().getCanonicalName(), e);
            } catch (final ContainerNotAvailableException e) {
                if (logger.isDebugEnabled()) {
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 8.3K bytes
    - Click Count (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

                        crawlerContext.getNumOfThread(), crawlerContext.maxDepth, crawlerContext.maxAccessCount);
            }
    
            // context
            crawlerContext.urlFilter = urlFilter;
            crawlerContext.ruleManager = ruleManager;
            crawlerContext.intervalController = intervalController;
    
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Mon Nov 24 03:59:47 GMT 2025
    - 17K bytes
    - Click Count (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

            this.clientFactory = clientFactory;
        }
    
        /**
         * Sets the crawler context.
         * @param crawlerContext The CrawlerContext instance.
         */
        public void setCrawlerContext(final CrawlerContext crawlerContext) {
            this.crawlerContext = crawlerContext;
        }
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Wed Dec 31 09:07:38 GMT 2025
    - 20.3K bytes
    - Click Count (0)
  5. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

                // num of threads
                final CrawlerContext crawlerContext = crawler.getCrawlerContext();
                final int numOfThread =
                        webConfig.getNumOfThread() != null ? webConfig.getNumOfThread() : Constants.DEFAULT_NUM_OF_THREAD_FOR_WEB;
                crawlerContext.setNumOfThread(numOfThread);
    
                // depth
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 25K bytes
    - Click Count (0)
  6. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                assertFalse(crawler1.crawlerContext == crawler2.crawlerContext);
    
                for (int i = 0; i < 100; i++) {
                    if (crawler1.crawlerContext.getStatus() == CrawlerStatus.RUNNING) {
                        break;
                    }
                    Thread.sleep(50);
                }
                assertEquals(CrawlerStatus.RUNNING, crawler1.crawlerContext.getStatus());
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Jan 15 01:11:43 GMT 2026
    - 7.8K bytes
    - Click Count (0)
  7. CLAUDE.md

    ---
    
    ## Key Components
    
    ### Core Classes
    
    - **Crawler** (`Crawler.java`): Main orchestrator - `execute()`, `addUrl()`, `cleanup()`, `stop()`
    - **CrawlerContext** (`CrawlerContext.java`): Execution context - `sessionId`, `status`, `accessCount`, `numOfThread`, `maxDepth`, `maxAccessCount`
    - **CrawlerThread** (`CrawlerThread.java`): Worker thread - Poll URL → Validate → Execute → Process → Queue children
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Mar 12 03:39:20 GMT 2026
    - 8.1K bytes
    - Click Count (0)
  8. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                assertFalse(sessionId1 == sessionId2);
                assertFalse(crawler1.crawlerContext == crawler2.crawlerContext);
    
                // Wait for both crawlers to start with polling
                long startTime = System.currentTimeMillis();
                while ((crawler1.crawlerContext.getStatus() != CrawlerStatus.RUNNING
                        || crawler2.crawlerContext.getStatus() != CrawlerStatus.RUNNING) && System.currentTimeMillis() - startTime < 5000) {
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Jan 15 01:11:43 GMT 2026
    - 13.1K bytes
    - Click Count (0)
  9. README.md

    ```java
    // Set maximum number of URLs to crawl
    crawler.crawlerContext.setMaxAccessCount(1000);
    
    // Set number of crawler threads
    crawler.crawlerContext.setNumOfThread(10);
    
    // Set maximum crawl depth
    crawler.crawlerContext.setMaxDepth(3);
    
    // Set request interval (politeness)
    crawler.crawlerContext.setDefaultIntervalTime(1000); // 1 second
    ```
    
    ### URL Filtering
    
    ```java
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Sun Aug 31 05:32:52 GMT 2025
    - 15.3K bytes
    - Click Count (0)
  10. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

                        log(logHelper, LogType.NOT_MODIFIED, crawlerContext, urlQueue);
    
                        responseData.setExecutionTime(systemHelper.getCurrentTimeAsLong() - startTime);
                        responseData.setParentUrl(urlQueue.getParentUrl());
                        responseData.setSessionId(crawlerContext.getSessionId());
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Dec 11 09:47:03 GMT 2025
    - 19.5K bytes
    - Click Count (0)
Back to Top