- Sort Score
- Num 10 results
- Language All
Results 11 - 20 of 485 for crawlers (0.05 seconds)
-
src/main/java/org/codelibs/fess/exec/Crawler.java
* </pre> */ public class Crawler { /** * Creates a new instance of Crawler. */ public Crawler() { // Default constructor } /** Logger instance for this class. */ private static final Logger logger = LogManager.getLogger(Crawler.class); /** Thread name for web and file system crawling process. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Mar 26 02:24:08 GMT 2026 - 32.4K bytes - Click Count (0) -
README.md
```java // Create multiple crawler instances Crawler crawler1 = container.getComponent("crawler"); crawler1.setSessionId("session1"); crawler1.addUrl("https://site1.com"); Crawler crawler2 = container.getComponent("crawler"); crawler2.setSessionId("session2"); crawler2.addUrl("https://site2.com"); // Execute concurrently crawler1.setBackground(true); crawler2.setBackground(true);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Sun Aug 31 05:32:52 GMT 2025 - 15.3K bytes - Click Count (0) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler1.getCrawlerContext().setMaxAccessCount(maxCount); crawler1.getCrawlerContext().setNumOfThread(numOfThread); final Crawler crawler2 = getComponent(Crawler.class); crawler2.setBackground(true); ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*"); crawler2.addUrl(url2); crawler2.getCrawlerContext().setMaxAccessCount(maxCount);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 7.8K bytes - Click Count (0) -
samples/crawler/src/main/java/okhttp3/sample/Crawler.java
OkHttpClient client = new OkHttpClient.Builder() .cache(cache) .callTimeout(5, TimeUnit.SECONDS) .build(); Crawler crawler = new Crawler(client, queueLimit, hostLimit); crawler.queue.add(HttpUrl.get(args[1])); crawler.parallelDrainQueue(threadCount); }
Created: Fri Apr 03 11:42:14 GMT 2026 - Last Modified: Wed Jul 23 00:58:06 GMT 2025 - 5K bytes - Click Count (0) -
fess-crawler-lasta/src/main/resources/crawler.xml
<components namespace="fessCrawler"> <include path="crawler/container.xml"/> <include path="crawler/client.xml"/> <include path="crawler/rule.xml"/> <include path="crawler/filter.xml"/> <include path="crawler/interval.xml"/> <include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/>
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Tue Nov 28 13:40:25 GMT 2017 - 1.7K bytes - Click Count (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/container/LastaCrawlerContainerTest.java
// Verify that multiple components can be retrieved final Crawler crawler1 = crawlerContainer.getComponent("crawler"); final Crawler crawler2 = crawlerContainer.getComponent("crawler"); // They should be different instances (prototype scope) assertNotNull(crawler1); assertNotNull(crawler2); } @Test public void test_isLastaCrawlerContainer() {
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Fri Jan 16 13:52:11 GMT 2026 - 2.7K bytes - Click Count (0) -
src/main/resources/mail/crawler.dfmail
/* [Crawler Notification] Crawler notification mail. */ subject: [FESS] Crawler completed: /*pmb.hostname*/ >>> --- Server Info --- Host Name: /*pmb.hostname:orElse('Unknown')*/ Job Name: /*pmb.jobname:orElse('Unknown')*/ --- Web/FileSystem Crawler --- Start Time: /*pmb.webFsCrawlStartTime:orElse('-')*/ End Time: /*pmb.webFsCrawlEndTime:orElse('-')*/ Exec Time: /*pmb.webFsCrawlExecTime:orElse('-')*/ ms --- Web/FileSystem Indexer ---
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Wed Jan 15 22:05:20 GMT 2020 - 1K bytes - Click Count (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
* It contains various attributes related to the crawler's state, configuration, and runtime data. * This class provides methods to access and modify these attributes, allowing for control and monitoring * of the crawler's behavior. * * <p> * The context includes information such as the session ID, active thread count, access count, crawler status,
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Wed Dec 31 09:07:38 GMT 2025 - 9K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java
*/ package org.codelibs.fess.crawler.processor; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.processor.impl.DefaultResponseProcessor;
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 3.7K bytes - Click Count (0) -
src/main/resources/fess_label_pl.properties
labels.crawling_info_delete_all_cancel=Anuluj labels.crawling_info_thread_dump=Zrzut wątków labels.crawling_info_CrawlerStartTime=Czas rozpoczęcia crawlera labels.crawling_info_CrawlerEndTime=Czas zakończenia crawlera labels.crawling_info_CrawlerExecTime=Czas wykonania crawlera labels.crawling_info_CrawlerStatus=Status crawlera labels.crawling_info_WebFsCrawlExecTime=Czas wykonania indeksowania (Web/Plik)
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Sat Mar 28 11:54:13 GMT 2026 - 53.2K bytes - Click Count (0)