Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 31 - 40 of 311 for Crawler (0.06 seconds)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

     */
    package org.codelibs.fess.crawler.client;
    
    import java.util.LinkedHashMap;
    import java.util.List;
    import java.util.Map;
    import java.util.regex.Matcher;
    import java.util.regex.Pattern;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Mon Nov 24 03:59:47 GMT 2025
    - 7.3K bytes
    - Click Count (0)
  2. src/test/java/org/codelibs/fess/it/CrawlTestBase.java

            }
            if (1500 <= count) {
                logger.info("Time out: Failed to start crawler)");
                fail(); // Time Out
            }
    
            logger.info("Crawler is running");
            count = 0;
            isRunning = true;
            sleepTime = 100; // Reset to 100ms for termination wait
    
            // Wait until the crawler terminates (with exponential backoff)
            while (count < 3000 && isRunning) {
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sun Jan 11 08:43:05 GMT 2026
    - 10.6K bytes
    - Click Count (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Wed Dec 31 09:07:38 GMT 2025
    - 20.3K bytes
    - Click Count (0)
  4. fess-crawler-lasta/src/main/resources/crawler/client.xml

    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/robotstxt.xml" />
    	<include path="crawler/contentlength.xml" />
    	<include path="crawler/mimetype.xml" />
    
    	<!-- HC5 (Default) -->
    	<component name="internalHttpClient" class="org.codelibs.fess.crawler.client.http.Hc5HttpClient"
    		instance="prototype">
    		<property name="connectionTimeout">15000</property>
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Jan 08 04:17:06 GMT 2026
    - 3.7K bytes
    - Click Count (0)
  5. src/main/java/org/codelibs/fess/crawler/util/FessCrawlerConfig.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.util;
    
    import org.codelibs.fess.util.ComponentUtil;
    
    /**
     * Fess-specific crawler configuration that extends OpenSearchCrawlerConfig.
     * This class provides configuration settings for the Fess crawler including
     * index names, shard counts, and replica counts for queue, data, and filter indices.
     */
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Jul 17 08:28:31 GMT 2025
    - 3.5K bytes
    - Click Count (0)
  6. fess-crawler-opensearch/pom.xml

    	<modelVersion>4.0.0</modelVersion>
    	<artifactId>fess-crawler-opensearch</artifactId>
    	<packaging>jar</packaging>
    	<name>Fess Crawler OpenSearch</name>
    	<parent>
    		<groupId>org.codelibs.fess</groupId>
    		<artifactId>fess-crawler-parent</artifactId>
    		<version>15.6.0-SNAPSHOT</version>
    		<relativePath>../pom.xml</relativePath>
    	</parent>
    	<build>
    		<plugins>
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Mar 05 23:30:42 GMT 2026
    - 3.9K bytes
    - Click Count (0)
  7. src/main/java/org/codelibs/fess/crawler/service/FessUrlQueueService.java

     */
    package org.codelibs.fess.crawler.service;
    
    import java.util.List;
    import java.util.Map;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue;
    import org.codelibs.fess.crawler.service.impl.OpenSearchUrlQueueService;
    import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Jul 17 08:28:31 GMT 2025
    - 4K bytes
    - Click Count (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClient.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.client;
    
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    
    /**
     * Interface representing a client for a web crawler.
     * This client is responsible for executing requests and handling responses.
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Sat Mar 15 06:52:00 GMT 2025
    - 1.8K bytes
    - Click Count (0)
  9. src/main/java/org/codelibs/fess/Constants.java

        public static final String CRAWLER_START_TIME = "CrawlerStartTime";
    
        /** Info map key for crawler end time. */
        public static final String CRAWLER_END_TIME = "CrawlerEndTime";
    
        /** Info map key for crawler execution time. */
        public static final String CRAWLER_EXEC_TIME = "CrawlerExecTime";
    
        /** Info map key for web/file system crawler start time. */
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sat Mar 28 11:55:54 GMT 2026
    - 35.8K bytes
    - Click Count (0)
  10. src/main/resources/crawler/rule.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/transformer.xml" />
    
    	<component name="ruleManager" class="org.codelibs.fess.crawler.rule.impl.RuleManagerImpl" instance="prototype">
    		<postConstruct name="addRule">
    			<arg>sitemapsRule</arg>
    		</postConstruct>
    		<postConstruct name="addRule">
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sun Mar 29 08:21:02 GMT 2026
    - 4.6K bytes
    - Click Count (0)
Back to Top