Search Options

Results per page
Sort
Preferred Languages
Advance

Results 31 - 40 of 524 for crawling (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

     *   <li>Handling exceptions that may occur during the crawling process.</li>
     * </ol>
     *
     * <p>
     * The thread also manages the active thread count using {@code crawlerContext.activeThreadCountLock}
     * and provides methods for logging messages using {@link LogHelper}.
     * </p>
     *
     * <p>
     * The crawling process continues until the crawler status is {@link CrawlerStatus#DONE} or the
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/app/pager/CrawlingInfoPager.java

        private int currentPageNumber;
    
        /**
         * Crawling information ID.
         */
        public String id;
    
        /**
         * Session ID for the crawling session.
         */
        public String sessionId;
    
        /**
         * Creation time of the crawling information.
         */
        public String createdTime;
    
        /**
         * Clears all pagination state and crawling information fields.
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 6.9K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImpl.java

        }
    
        /**
         * Adds a document to the search index by crawling the specified URL and processing the content.
         * This method handles recursive crawling with depth and access count limits, follows redirects,
         * and processes child URLs discovered during crawling.
         *
         * @param paramMap the data store parameters containing crawling configuration
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 28.9K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/web/admin/webconfig/CreateForm.java

        @CustomSize(maxKey = "form.admin.max.input.size")
        public String urls;
    
        /**
         * URL patterns to include during crawling.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String includedUrls;
    
        /**
         * URL patterns to exclude during crawling.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String excludedUrls;
    
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  5. src/main/resources/fess_label.properties

    labels.createdTime=Created Time
    labels.depth=Depth
    labels.excludedPaths=Excluded Paths for Crawling
    labels.excludedUrls=Excluded URLs for Crawling
    labels.excludedDocPaths=Excluded Paths for Searching
    labels.excludedDocUrls=Excluded URLs for Searching
    labels.hostname=Hostname
    labels.id=ID
    labels.includedPaths=Included Paths for Crawling
    labels.includedUrls=Included URLs for Crawling
    labels.includedDocPaths=Included Paths for Searching
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jun 28 08:40:50 UTC 2025
    - 40.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

        /**
         * Filter for URLs to control which URLs are processed.
         */
        protected UrlFilter urlFilter;
    
        /**
         * Manager for crawling rules and configurations.
         */
        protected RuleManager ruleManager;
    
        /**
         * Controller for managing crawling intervals and delays.
         */
        protected IntervalController intervalController;
    
        /**
         * Set of robots.txt URLs that have been processed.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/ingest/Ingester.java

            return ComponentUtil.getIngestFactory();
        }
    
        /**
         * Processes a result data object for web/file crawling.
         * Default implementation returns the target unchanged.
         *
         * @param target the result data to process
         * @param responseData the response data from crawling
         * @return the processed result data
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.1K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/job/PurgeLogJob.java

            final StringBuilder resultBuf = new StringBuilder();
    
            // purge crawling sessions
            try {
                crawlingInfoService.deleteBefore(systemHelper.getCurrentTimeAsLong());
            } catch (final Exception e) {
                logger.error("Failed to purge crawling sessions.", e);
                resultBuf.append(e.getMessage()).append("\n");
            }
    
            // purge search logs
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/app/web/api/admin/fileconfig/SearchBody.java

    import org.codelibs.fess.app.web.api.admin.BaseSearchBody;
    
    /**
     * Search request body for file crawling configuration administration API.
     */
    public class SearchBody extends BaseSearchBody {
    
        /**
         * Default constructor.
         */
        public SearchBody() {
            super();
        }
    
        /** Name of the file crawling configuration */
        public String name;
    
        /** File paths to crawl */
        public String paths;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java

            }
    
            if (cae.isDebugEnabled()) {
                logger.debug("[{}] Crawling Access Exception at {}", failureUrlId, urlQueue.getUrl(), cae);
            } else if (cae.isInfoEnabled()) {
                logger.info("[{}] {}", failureUrlId, cae.getMessage());
            } else if (cae.isWarnEnabled()) {
                logger.warn("[{}] Crawling Access Exception at {}", failureUrlId, urlQueue.getUrl(), cae);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 8.2K bytes
    - Viewed (0)
Back to top