Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 296 for crawler_ (0.04 sec)

  1. samples/crawler/src/main/java/okhttp3/sample/Crawler.java

        OkHttpClient client = new OkHttpClient.Builder()
            .cache(cache)
            .callTimeout(5, TimeUnit.SECONDS)
            .build();
    
        Crawler crawler = new Crawler(client, queueLimit, hostLimit);
        crawler.queue.add(HttpUrl.get(args[1]));
        crawler.parallelDrainQueue(threadCount);
      }
    Registered: Fri Sep 05 11:42:10 UTC 2025
    - Last Modified: Wed Jul 23 00:58:06 UTC 2025
    - 5K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler1.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler1.getCrawlerContext().setNumOfThread(numOfThread);
    
                final Crawler crawler2 = getComponent(Crawler.class);
                crawler2.setBackground(true);
                ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*");
                crawler2.addUrl(url2);
                crawler2.getCrawlerContext().setMaxAccessCount(maxCount);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. fess-crawler-lasta/src/main/resources/crawler.xml

    <components namespace="fessCrawler">
    	<include path="crawler/container.xml"/>
    	<include path="crawler/client.xml"/>
    	<include path="crawler/rule.xml"/>
    	<include path="crawler/filter.xml"/>
    	<include path="crawler/interval.xml"/>
    	<include path="crawler/extractor.xml"/>
    	<include path="crawler/mimetype.xml"/>
    	<include path="crawler/encoding.xml"/>
    	<include path="crawler/urlconverter.xml"/>
    	<include path="crawler/log.xml"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Tue Nov 28 13:40:25 UTC 2017
    - 1.7K bytes
    - Viewed (0)
  4. src/main/resources/mail/crawler.dfmail

    /*
     [Crawler Notification]
     Crawler notification mail.
    */
    subject: [FESS] Crawler completed: /*pmb.hostname*/
    >>>
    --- Server Info ---
    Host Name: /*pmb.hostname:orElse('Unknown')*/
    Job Name: /*pmb.jobname:orElse('Unknown')*/
    
    --- Web/FileSystem Crawler ---
    Start Time: /*pmb.webFsCrawlStartTime:orElse('-')*/
    End Time:   /*pmb.webFsCrawlEndTime:orElse('-')*/
    Exec Time:  /*pmb.webFsCrawlExecTime:orElse('-')*/ ms
    
    --- Web/FileSystem Indexer ---
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Wed Jan 15 22:05:20 UTC 2020
    - 1K bytes
    - Viewed (0)
  5. src/main/resources/crawler_es+crawlerThread.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<!-- Crawler Thread -->
    	<component name="crawlerThread" class="org.codelibs.fess.crawler.FessCrawlerThread" instance="prototype" >
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jan 28 04:42:09 UTC 2016
    - 342 bytes
    - Viewed (0)
  6. src/main/resources/crawler_es+urlQueueService.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<component name="urlQueueService"
    		class="org.codelibs.fess.crawler.service.FessUrlQueueService">
    		<arg>crawlerConfig</arg>
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Nov 03 05:09:36 UTC 2024
    - 336 bytes
    - Viewed (0)
  7. src/main/resources/crawler_es+crawlerConfig.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<component name="crawlerConfig" class="org.codelibs.fess.crawler.util.FessCrawlerConfig">
    		<property name="queueIndex">"fess_crawler.queue"</property>
    		<property name="queueShards">5</property>
    		<property name="queueReplicas">1</property>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Fri Dec 03 13:06:40 UTC 2021
    - 756 bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

         * Datetime format.
         *
         * By providing the last modification timestamp, you enable search engine
         * crawlers to retrieve only a subset of the Sitemaps in the index i.e. a
         * crawler may only retrieve Sitemaps that were modified since a certain
         * date. This incremental Sitemap fetching mechanism allows for the rapid
         * discovery of new URLs on very large sites.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.4K bytes
    - Viewed (1)
  9. src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java

     */
    package org.codelibs.fess.crawler.processor;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.processor.impl.DefaultResponseProcessor;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

     */
    package org.codelibs.fess.crawler;
    
    import java.util.Set;
    import java.util.concurrent.atomic.AtomicLong;
    
    import org.codelibs.core.collection.LruHashSet;
    import org.codelibs.fess.crawler.filter.UrlFilter;
    import org.codelibs.fess.crawler.interval.IntervalController;
    import org.codelibs.fess.crawler.rule.RuleManager;
    
    /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
Back to top