Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 77 for crawler_ (0.06 sec)

  1. src/main/java/org/codelibs/fess/exec/Crawler.java

                if (logger.isDebugEnabled()) {
                    logger.debug("Crawler is stopped.", e);
                } else if (logger.isInfoEnabled()) {
                    logger.info("Crawler is stopped.");
                }
                exitCode = Constants.EXIT_FAIL;
            } catch (final Throwable t) {
                logger.error("Crawler does not work correctly.", t);
                exitCode = Constants.EXIT_FAIL;
            } finally {
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:20:39 UTC 2024
    - 24K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler1.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler1.getCrawlerContext().setNumOfThread(numOfThread);
    
                Thread.sleep(100);
    
                final Crawler crawler2 = getComponent(Crawler.class);
                crawler2.setBackground(true);
                ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*");
                crawler2.addUrl(url2);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 7.7K bytes
    - Viewed (0)
  3. docs/de/README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute"): Web-Framework
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job"): Job-Scheduler
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler"): Web-Crawler
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.6K bytes
    - Viewed (0)
  4. docs/fr/README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute") : Framework Web
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job") : Planificateur de tâches
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler") : Crawler Web
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:41:37 UTC 2024
    - 15.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.exception.MaxLengthExceededException;
    import org.codelibs.fess.crawler.helper.ContentLengthHelper;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:40:57 UTC 2024
    - 6.3K bytes
    - Viewed (0)
  7. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

    <components namespace="fessCrawler">
        <include path="crawler/container.xml"/>
        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.Crawler;
    import org.codelibs.fess.crawler.CrawlerContext;
    import org.codelibs.fess.crawler.CrawlerStatus;
    import org.codelibs.fess.crawler.interval.FessIntervalController;
    import org.codelibs.fess.crawler.service.impl.EsDataService;
    import org.codelibs.fess.crawler.service.impl.EsUrlFilterService;
    import org.codelibs.fess.crawler.service.impl.EsUrlQueueService;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:11:58 UTC 2024
    - 22.6K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueueImpl.java

        protected float weight = 1.0f;
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.entity.UrlQueue#getId()
         */
        @Override
        public IDTYPE getId() {
            return id;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.entity.UrlQueue#setId(IDTYPE)
         */
        @Override
        public void setId(final IDTYPE id) {
            this.id = id;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Mon Nov 04 07:44:18 UTC 2024
    - 5.2K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/indexer/IndexUpdater.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.Crawler;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.EsAccessResult;
    import org.codelibs.fess.crawler.entity.EsUrlQueue;
    import org.codelibs.fess.crawler.service.DataService;
    import org.codelibs.fess.crawler.service.UrlFilterService;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:20:39 UTC 2024
    - 24.2K bytes
    - Viewed (0)
Back to top