Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 168 for crawlen (0.08 sec)

  1. docs/de/README.md

    Sie können in der Administrationsoberfläche (Web, Datei, Datenspeicher) Crawling-Ziele in den Crawler-Konfigurationsseiten registrieren und den Crawler manuell auf der [Scheduler-Seite](https://fess.codelibs.org/14.17/admin/scheduler-guide.html) starten.
    
    ## Migration von einem anderen Suchanbieter
    
    Bitte lesen Sie [MIGRATION.md](MIGRATION.md).
    
    ## Datenspeicher
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.6K bytes
    - Viewed (0)
  2. samples/crawler/src/main/java/okhttp3/sample/Crawler.java

        OkHttpClient client = new OkHttpClient.Builder()
            .cache(cache)
            .callTimeout(5, TimeUnit.SECONDS)
            .build();
    
        Crawler crawler = new Crawler(client, queueLimit, hostLimit);
        crawler.queue.add(HttpUrl.get(args[1]));
        crawler.parallelDrainQueue(threadCount);
      }
    Registered: Fri Sep 05 11:42:10 UTC 2025
    - Last Modified: Wed Jul 23 00:58:06 UTC 2025
    - 5K bytes
    - Viewed (0)
  3. src/main/resources/mail/crawler.dfmail

    /*
     [Crawler Notification]
     Crawler notification mail.
    */
    subject: [FESS] Crawler completed: /*pmb.hostname*/
    >>>
    --- Server Info ---
    Host Name: /*pmb.hostname:orElse('Unknown')*/
    Job Name: /*pmb.jobname:orElse('Unknown')*/
    
    --- Web/FileSystem Crawler ---
    Start Time: /*pmb.webFsCrawlStartTime:orElse('-')*/
    End Time:   /*pmb.webFsCrawlEndTime:orElse('-')*/
    Exec Time:  /*pmb.webFsCrawlExecTime:orElse('-')*/ ms
    
    --- Web/FileSystem Indexer ---
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Wed Jan 15 22:05:20 UTC 2020
    - 1K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java

     */
    package org.codelibs.fess.crawler.processor;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.processor.impl.DefaultResponseProcessor;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/crawler/service/FessUrlQueueService.java

     */
    package org.codelibs.fess.crawler.service;
    
    import java.util.List;
    import java.util.Map;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue;
    import org.codelibs.fess.crawler.service.impl.OpenSearchUrlQueueService;
    import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/app/web/admin/fileconfig/CreateForm.java

        /** Additional configuration parameters for the file crawler. */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String configParameter;
    
        /** The maximum crawling depth (0 to 2147483647, 0 means unlimited). */
        @Min(value = 0)
        @Max(value = 2147483647)
        @ValidateTypeFailure
        public Integer depth;
    
        /** The maximum number of documents to access during crawling (0 means unlimited). */
        @Min(value = 0)
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.6K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/admin/webconfig/CreateForm.java

         */
        @Min(value = 0)
        @Max(value = 9223372036854775807L)
        @ValidateTypeFailure
        public Long maxAccessCount;
    
        /**
         * The user agent string to use during crawling.
         */
        @Required
        @Size(max = 200)
        public String userAgent;
    
        /**
         * The number of crawler threads to use.
         */
        @Required
        @Min(value = 1)
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  8. README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute"): Web Framework
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job"): Job Scheduler
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler"): Web Crawler
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 10 06:34:32 UTC 2025
    - 7.2K bytes
    - Viewed (2)
  9. src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java

    import org.codelibs.fess.app.service.FailureUrlService;
    import org.codelibs.fess.crawler.CrawlerContext;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.exception.MultipleCrawlingAccessException;
    import org.codelibs.fess.crawler.helper.impl.LogHelperImpl;
    import org.codelibs.fess.crawler.log.LogType;
    import org.codelibs.fess.exception.ContainerNotAvailableException;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 8.2K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/app/pager/FileConfigPager.java

        /** Configuration ID */
        public String id;
    
        /** Configuration name */
        public String name;
    
        /** File system paths to crawl */
        public String paths;
    
        /** Number of threads for crawling */
        public String numOfThread;
    
        /** Interval time between crawling operations */
        public String intervalTime;
    
        /** Boost value for search ranking */
        public String boost;
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 7.3K bytes
    - Viewed (0)
Back to top