- Sort Score
- Num 10 results
- Language All
Results 1 - 10 of 278 for Crawler (0.07 seconds)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
* * <p>Example usage: * <pre> * Crawler crawler = new Crawler(); * crawler.addUrl("http://example.com/"); * crawler.execute(); * crawler.close(); * </pre> */ public class Crawler implements Runnable, AutoCloseable { private static final Logger logger = LogManager.getLogger(Crawler.class); /** * Service for managing URL queues during crawling. */
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Mon Nov 24 03:59:47 GMT 2025 - 17K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/exec/Crawler.java
* </pre> */ public class Crawler { /** * Creates a new instance of Crawler. */ public Crawler() { // Default constructor } /** Logger instance for this class. */ private static final Logger logger = LogManager.getLogger(Crawler.class); /** Thread name for web and file system crawling process. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Mar 26 02:24:08 GMT 2026 - 32.4K bytes - Click Count (0) -
samples/crawler/src/main/java/okhttp3/sample/Crawler.java
OkHttpClient client = new OkHttpClient.Builder() .cache(cache) .callTimeout(5, TimeUnit.SECONDS) .build(); Crawler crawler = new Crawler(client, queueLimit, hostLimit); crawler.queue.add(HttpUrl.get(args[1])); crawler.parallelDrainQueue(threadCount); }
Created: Fri Apr 03 11:42:14 GMT 2026 - Last Modified: Wed Jul 23 00:58:06 GMT 2025 - 5K bytes - Click Count (0) -
README.md
```java // Create multiple crawler instances Crawler crawler1 = container.getComponent("crawler"); crawler1.setSessionId("session1"); crawler1.addUrl("https://site1.com"); Crawler crawler2 = container.getComponent("crawler"); crawler2.setSessionId("session2"); crawler2.addUrl("https://site2.com"); // Execute concurrently crawler1.setBackground(true); crawler2.setBackground(true);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Sun Aug 31 05:32:52 GMT 2025 - 15.3K bytes - Click Count (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/container/LastaCrawlerContainerTest.java
// Verify that multiple components can be retrieved final Crawler crawler1 = crawlerContainer.getComponent("crawler"); final Crawler crawler2 = crawlerContainer.getComponent("crawler"); // They should be different instances (prototype scope) assertNotNull(crawler1); assertNotNull(crawler2); } @Test public void test_isLastaCrawlerContainer() {
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Fri Jan 16 13:52:11 GMT 2026 - 2.7K bytes - Click Count (0) -
src/main/resources/fess_indices/fess_config.scheduled_job/scheduled_job.bulk
{"index":{"_index":"fess_config.scheduled_job","_id":"default_crawler"}} {"name":"Default Crawler","target":"all","cronExpression":"0 0 * * *","scriptType":"groovy","scriptData":"return container.getComponent(\"crawlJob\").logLevel(\"info\").gcLogging().execute(executor);","jobLogging":true,"crawler":true,"available":true,"sortOrder":1,"createdBy":"system","createdTime":0,"updatedBy":"system","updatedTime":0} {"index":{"_index":"fess_config.scheduled_job","_id":"suggest_indexer"}}
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Mar 26 02:24:08 GMT 2026 - 5K bytes - Click Count (0) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler1.getCrawlerContext().setMaxAccessCount(maxCount); crawler1.getCrawlerContext().setNumOfThread(numOfThread); final Crawler crawler2 = getComponent(Crawler.class); crawler2.setBackground(true); ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*"); crawler2.addUrl(url2); crawler2.getCrawlerContext().setMaxAccessCount(maxCount);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 7.8K bytes - Click Count (0) -
CLAUDE.md
**DI Config**: `fess-crawler-lasta/src/main/resources/` - `crawler.xml` (root), `crawler/client.xml`, `crawler/extractor.xml`, `crawler/rule.xml`, `crawler/transformer.xml`, `crawler/transformer_basic.xml` - `crawler/mimetype.xml`, `crawler/encoding.xml`, `crawler/robotstxt.xml`, `crawler/sitemaps.xml`
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Mar 12 03:39:20 GMT 2026 - 8.1K bytes - Click Count (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler1.addUrl(url1); crawler1.getCrawlerContext().setMaxAccessCount(maxCount); crawler1.getCrawlerContext().setNumOfThread(numOfThread); final Crawler crawler2 = crawlerContainer.getComponent("crawler"); crawler2.setSessionId(crawler2.getSessionId() + "2"); crawler2.setBackground(true);
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 13.1K bytes - Click Count (0) -
fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml
<components namespace="fessCrawler"> <include path="crawler/container.xml"/> <include path="crawler/client.xml"/> <include path="crawler/rule.xml"/> <include path="crawler/filter.xml"/> <include path="crawler/interval.xml"/> <include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/>
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Nov 07 04:44:10 GMT 2024 - 2.2K bytes - Click Count (0)