- Sort Score
- Num 10 results
- Language All
Results 1 - 10 of 11 for CrawlerContext (0.11 seconds)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
* </p> * * <p> * It also provides thread-local storage for sitemaps, allowing each thread to have its own set of sitemaps. * </p> */ public class CrawlerContext { /** * Constructs a new CrawlerContext. */ public CrawlerContext() { // Default constructor } /** * Session identifier for the crawling session. */ protected String sessionId; /**
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Wed Dec 31 09:07:38 GMT 2025 - 9K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java
final UrlQueue<?> urlQueue = objs.length > 1 && objs[1] instanceof UrlQueue<?> ? (UrlQueue<?>) objs[1] : null; try { final CrawlerContext crawlerContext = (CrawlerContext) objs[0]; final Throwable e = (Throwable) objs[2]; storeFailureUrl(crawlerContext, urlQueue, e.getClass().getCanonicalName(), e); } catch (final ContainerNotAvailableException e) { if (logger.isDebugEnabled()) {
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Fri Nov 28 16:29:12 GMT 2025 - 8.3K bytes - Click Count (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
crawlerContext.getNumOfThread(), crawlerContext.maxDepth, crawlerContext.maxAccessCount); } // context crawlerContext.urlFilter = urlFilter; crawlerContext.ruleManager = ruleManager; crawlerContext.intervalController = intervalController;
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Mon Nov 24 03:59:47 GMT 2025 - 17K bytes - Click Count (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java
this.clientFactory = clientFactory; } /** * Sets the crawler context. * @param crawlerContext The CrawlerContext instance. */ public void setCrawlerContext(final CrawlerContext crawlerContext) { this.crawlerContext = crawlerContext; }
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Wed Dec 31 09:07:38 GMT 2025 - 20.3K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java
// num of threads final CrawlerContext crawlerContext = crawler.getCrawlerContext(); final int numOfThread = webConfig.getNumOfThread() != null ? webConfig.getNumOfThread() : Constants.DEFAULT_NUM_OF_THREAD_FOR_WEB; crawlerContext.setNumOfThread(numOfThread); // depth
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Fri Nov 28 16:29:12 GMT 2025 - 25K bytes - Click Count (0) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
assertFalse(crawler1.crawlerContext == crawler2.crawlerContext); for (int i = 0; i < 100; i++) { if (crawler1.crawlerContext.getStatus() == CrawlerStatus.RUNNING) { break; } Thread.sleep(50); } assertEquals(CrawlerStatus.RUNNING, crawler1.crawlerContext.getStatus());
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 7.8K bytes - Click Count (0) -
CLAUDE.md
--- ## Key Components ### Core Classes - **Crawler** (`Crawler.java`): Main orchestrator - `execute()`, `addUrl()`, `cleanup()`, `stop()` - **CrawlerContext** (`CrawlerContext.java`): Execution context - `sessionId`, `status`, `accessCount`, `numOfThread`, `maxDepth`, `maxAccessCount` - **CrawlerThread** (`CrawlerThread.java`): Worker thread - Poll URL → Validate → Execute → Process → Queue children
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Mar 12 03:39:20 GMT 2026 - 8.1K bytes - Click Count (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
assertFalse(sessionId1 == sessionId2); assertFalse(crawler1.crawlerContext == crawler2.crawlerContext); // Wait for both crawlers to start with polling long startTime = System.currentTimeMillis(); while ((crawler1.crawlerContext.getStatus() != CrawlerStatus.RUNNING || crawler2.crawlerContext.getStatus() != CrawlerStatus.RUNNING) && System.currentTimeMillis() - startTime < 5000) {
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 13.1K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java
log(logHelper, LogType.NOT_MODIFIED, crawlerContext, urlQueue); responseData.setExecutionTime(systemHelper.getCurrentTimeAsLong() - startTime); responseData.setParentUrl(urlQueue.getParentUrl()); responseData.setSessionId(crawlerContext.getSessionId());
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Dec 11 09:47:03 GMT 2025 - 19.5K bytes - Click Count (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/Hc4HttpClient.java
// not support robots.txt return; } // crawler context final CrawlerContext crawlerContext = CrawlingParameterUtil.getCrawlerContext(); if (crawlerContext == null) { // wrong state return; } final int idx = url.indexOf('/', url.indexOf("://") + 3); String hostUrl;
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Fri Jan 09 23:46:52 GMT 2026 - 54.4K bytes - Click Count (0)