Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 445 for crawler_ (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * Please note that the value of this tag is considered a hint and not a
         * command. Even though search engine crawlers may consider this information
         * when making decisions, they may crawl pages marked "hourly" less
         * frequently than that, and they may crawl pages marked "yearly" more
         * frequently than that. Crawlers may periodically crawl pages marked
         * "never" so that they can handle unexpected changes to those pages.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.OpenSearchAccessException;
    import org.codelibs.fess.crawler.service.UrlQueueService;
    import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java

        /** Indicates a general exception during crawling. */
        CRAWLING_EXCEPTION,
        /** Indicates no URL is available in the queue. */
        NO_URL_IN_QUEUE,
        /** Indicates the start of a crawler thread. */
        START_THREAD,
        /** Indicates the finish of a crawler thread. */
        FINISHED_THREAD,
        /** Indicates no response processor is available. */
        NO_RESPONSE_PROCESSOR,
        /** Indicates no rule is available for processing. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.Crawler;
    import org.codelibs.fess.crawler.CrawlerContext;
    import org.codelibs.fess.crawler.CrawlerStatus;
    import org.codelibs.fess.crawler.interval.FessIntervalController;
    import org.codelibs.fess.crawler.service.impl.OpenSearchDataService;
    import org.codelibs.fess.crawler.service.impl.OpenSearchUrlFilterService;
    import org.codelibs.fess.crawler.service.impl.OpenSearchUrlQueueService;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 24.9K bytes
    - Viewed (0)
  5. docs/de/README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute"): Web-Framework
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job"): Job-Scheduler
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler"): Web-Crawler
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.6K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/crawler/transformer/FessTransformer.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.util.CrawlingParameterUtil;
    import org.codelibs.fess.crawler.util.FieldConfigs;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/admin/wizard/AdminWizardAction.java

        protected DynamicProperties systemProperties;
    
        /** Service for managing web crawler configurations */
        @Resource
        protected WebConfigService webConfigService;
    
        /** Service for managing file crawler configurations */
        @Resource
        protected FileConfigService fileConfigService;
    
        /** Helper for managing crawler processes */
        @Resource
        protected ProcessHelper processHelper;
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 15.8K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/app/web/admin/webconfig/CreateForm.java

         * Document URL patterns to exclude from search index.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String excludedDocUrls;
    
        /**
         * Additional configuration parameters for the crawler.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String configParameter;
    
        /**
         * The maximum crawling depth from the starting URLs.
         */
        @Min(value = 0)
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  9. docs/fr/README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute") : Framework Web
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job") : Planificateur de tâches
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler") : Crawler Web
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.9K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResponseData.java

    import java.util.Map;
    import java.util.Set;
    
    import org.codelibs.core.exception.IORuntimeException;
    import org.codelibs.core.io.FileUtil;
    import org.codelibs.fess.crawler.Constants;
    
    /**
     * Represents the response data obtained from a crawled resource.
     * This class encapsulates various details of an HTTP response, including
     * status code, content type, content length, and the response body.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 11.6K bytes
    - Viewed (0)
Back to top