- Sort Score
- Num 10 results
- Language All
Results 1 - 10 of 311 for Crawler (0.6 seconds)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
* * <p>Example usage: * <pre> * Crawler crawler = new Crawler(); * crawler.addUrl("http://example.com/"); * crawler.execute(); * crawler.close(); * </pre> */ public class Crawler implements Runnable, AutoCloseable { private static final Logger logger = LogManager.getLogger(Crawler.class); /** * Service for managing URL queues during crawling. */
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Mon Nov 24 03:59:47 GMT 2025 - 17K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/exec/Crawler.java
* </pre> */ public class Crawler { /** * Creates a new instance of Crawler. */ public Crawler() { // Default constructor } /** Logger instance for this class. */ private static final Logger logger = LogManager.getLogger(Crawler.class); /** Thread name for web and file system crawling process. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Mar 26 02:24:08 GMT 2026 - 32.4K bytes - Click Count (0) -
samples/crawler/src/main/java/okhttp3/sample/Crawler.java
OkHttpClient client = new OkHttpClient.Builder() .cache(cache) .callTimeout(5, TimeUnit.SECONDS) .build(); Crawler crawler = new Crawler(client, queueLimit, hostLimit); crawler.queue.add(HttpUrl.get(args[1])); crawler.parallelDrainQueue(threadCount); }
Created: Fri Apr 03 11:42:14 GMT 2026 - Last Modified: Wed Jul 23 00:58:06 GMT 2025 - 5K bytes - Click Count (0) -
fess-crawler-lasta/src/main/resources/crawler.xml
<components namespace="fessCrawler"> <include path="crawler/container.xml"/> <include path="crawler/client.xml"/> <include path="crawler/rule.xml"/> <include path="crawler/filter.xml"/> <include path="crawler/interval.xml"/> <include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/>
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Tue Nov 28 13:40:25 GMT 2017 - 1.7K bytes - Click Count (0) -
src/main/resources/mail/crawler.dfmail
/* [Crawler Notification] Crawler notification mail. */ subject: [FESS] Crawler completed: /*pmb.hostname*/ >>> --- Server Info --- Host Name: /*pmb.hostname:orElse('Unknown')*/ Job Name: /*pmb.jobname:orElse('Unknown')*/ --- Web/FileSystem Crawler --- Start Time: /*pmb.webFsCrawlStartTime:orElse('-')*/ End Time: /*pmb.webFsCrawlEndTime:orElse('-')*/ Exec Time: /*pmb.webFsCrawlExecTime:orElse('-')*/ ms --- Web/FileSystem Indexer ---
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Wed Jan 15 22:05:20 GMT 2020 - 1K bytes - Click Count (0) -
README.md
```java // Create multiple crawler instances Crawler crawler1 = container.getComponent("crawler"); crawler1.setSessionId("session1"); crawler1.addUrl("https://site1.com"); Crawler crawler2 = container.getComponent("crawler"); crawler2.setSessionId("session2"); crawler2.addUrl("https://site2.com"); // Execute concurrently crawler1.setBackground(true); crawler2.setBackground(true);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Sun Aug 31 05:32:52 GMT 2025 - 15.3K bytes - Click Count (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/container/LastaCrawlerContainerTest.java
// Verify that multiple components can be retrieved final Crawler crawler1 = crawlerContainer.getComponent("crawler"); final Crawler crawler2 = crawlerContainer.getComponent("crawler"); // They should be different instances (prototype scope) assertNotNull(crawler1); assertNotNull(crawler2); } @Test public void test_isLastaCrawlerContainer() {
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Fri Jan 16 13:52:11 GMT 2026 - 2.7K bytes - Click Count (0) -
src/main/resources/fess_indices/fess_config.scheduled_job/scheduled_job.bulk
{"index":{"_index":"fess_config.scheduled_job","_id":"default_crawler"}} {"name":"Default Crawler","target":"all","cronExpression":"0 0 * * *","scriptType":"groovy","scriptData":"return container.getComponent(\"crawlJob\").logLevel(\"info\").gcLogging().execute(executor);","jobLogging":true,"crawler":true,"available":true,"sortOrder":1,"createdBy":"system","createdTime":0,"updatedBy":"system","updatedTime":0} {"index":{"_index":"fess_config.scheduled_job","_id":"suggest_indexer"}}
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Mar 26 02:24:08 GMT 2026 - 5K bytes - Click Count (0) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler1.getCrawlerContext().setMaxAccessCount(maxCount); crawler1.getCrawlerContext().setNumOfThread(numOfThread); final Crawler crawler2 = getComponent(Crawler.class); crawler2.setBackground(true); ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*"); crawler2.addUrl(url2); crawler2.getCrawlerContext().setMaxAccessCount(maxCount);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 7.8K bytes - Click Count (0) -
CLAUDE.md
**DI Config**: `fess-crawler-lasta/src/main/resources/` - `crawler.xml` (root), `crawler/client.xml`, `crawler/extractor.xml`, `crawler/rule.xml`, `crawler/transformer.xml`, `crawler/transformer_basic.xml` - `crawler/mimetype.xml`, `crawler/encoding.xml`, `crawler/robotstxt.xml`, `crawler/sitemaps.xml`
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Mar 12 03:39:20 GMT 2026 - 8.1K bytes - Click Count (0)