- Sort Score
- Num 10 results
- Language All
Results 31 - 40 of 311 for Crawler (0.06 seconds)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java
*/ package org.codelibs.fess.crawler.client; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; import java.util.regex.Matcher; import java.util.regex.Pattern; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.container.CrawlerContainer;
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Mon Nov 24 03:59:47 GMT 2025 - 7.3K bytes - Click Count (0) -
src/test/java/org/codelibs/fess/it/CrawlTestBase.java
} if (1500 <= count) { logger.info("Time out: Failed to start crawler)"); fail(); // Time Out } logger.info("Crawler is running"); count = 0; isRunning = true; sleepTime = 100; // Reset to 100ms for termination wait // Wait until the crawler terminates (with exponential backoff) while (count < 3000 && isRunning) {
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Sun Jan 11 08:43:05 GMT 2026 - 10.6K bytes - Click Count (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java
import org.codelibs.fess.crawler.client.CrawlerClientFactory; import org.codelibs.fess.crawler.container.CrawlerContainer; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.exception.ChildUrlsException;
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Wed Dec 31 09:07:38 GMT 2025 - 20.3K bytes - Click Count (0) -
fess-crawler-lasta/src/main/resources/crawler/client.xml
"http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <include path="crawler/robotstxt.xml" /> <include path="crawler/contentlength.xml" /> <include path="crawler/mimetype.xml" /> <!-- HC5 (Default) --> <component name="internalHttpClient" class="org.codelibs.fess.crawler.client.http.Hc5HttpClient" instance="prototype"> <property name="connectionTimeout">15000</property>
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 08 04:17:06 GMT 2026 - 3.7K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/crawler/util/FessCrawlerConfig.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.util; import org.codelibs.fess.util.ComponentUtil; /** * Fess-specific crawler configuration that extends OpenSearchCrawlerConfig. * This class provides configuration settings for the Fess crawler including * index names, shard counts, and replica counts for queue, data, and filter indices. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 3.5K bytes - Click Count (0) -
fess-crawler-opensearch/pom.xml
<modelVersion>4.0.0</modelVersion> <artifactId>fess-crawler-opensearch</artifactId> <packaging>jar</packaging> <name>Fess Crawler OpenSearch</name> <parent> <groupId>org.codelibs.fess</groupId> <artifactId>fess-crawler-parent</artifactId> <version>15.6.0-SNAPSHOT</version> <relativePath>../pom.xml</relativePath> </parent> <build> <plugins>
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Mar 05 23:30:42 GMT 2026 - 3.9K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/crawler/service/FessUrlQueueService.java
*/ package org.codelibs.fess.crawler.service; import java.util.List; import java.util.Map; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue; import org.codelibs.fess.crawler.service.impl.OpenSearchUrlQueueService; import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 4K bytes - Click Count (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClient.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.client; import java.util.Map; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; /** * Interface representing a client for a web crawler. * This client is responsible for executing requests and handling responses.
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Sat Mar 15 06:52:00 GMT 2025 - 1.8K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/Constants.java
public static final String CRAWLER_START_TIME = "CrawlerStartTime"; /** Info map key for crawler end time. */ public static final String CRAWLER_END_TIME = "CrawlerEndTime"; /** Info map key for crawler execution time. */ public static final String CRAWLER_EXEC_TIME = "CrawlerExecTime"; /** Info map key for web/file system crawler start time. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Sat Mar 28 11:55:54 GMT 2026 - 35.8K bytes - Click Count (0) -
src/main/resources/crawler/rule.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <include path="crawler/transformer.xml" /> <component name="ruleManager" class="org.codelibs.fess.crawler.rule.impl.RuleManagerImpl" instance="prototype"> <postConstruct name="addRule"> <arg>sitemapsRule</arg> </postConstruct> <postConstruct name="addRule">
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Sun Mar 29 08:21:02 GMT 2026 - 4.6K bytes - Click Count (0)