Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 164 for Crawling (0.06 sec)

  1. src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/EditForm.java

        /**
         * The unique identifier of the crawling information entry being edited.
         * This is a required field for identifying which crawling info to update.
         */
        @Required
        @Size(max = 1000)
        public String id;
    
        /**
         * The session identifier of the crawling session.
         * This is a required field that identifies the specific crawling session.
         * Maximum length is 20 characters.
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.7K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/exception/DataStoreCrawlingException.java

    /**
     * Exception thrown when an error occurs during data store crawling operations.
     * This exception provides information about the URL where the error occurred
     * and whether the crawling process should be aborted.
     */
    public class DataStoreCrawlingException extends CrawlingAccessException {
    
        private static final long serialVersionUID = 1L;
    
        /**
         * The URL where the crawling error occurred.
         */
        private final String url;
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Wed Nov 19 08:04:23 UTC 2025
    - 2.7K bytes
    - Viewed (0)
  3. README.md

            
            // Configure crawling parameters
            crawler.addUrl("https://example.com");
            crawler.crawlerContext.setMaxAccessCount(100);
            crawler.crawlerContext.setNumOfThread(5);
            crawler.urlFilter.addInclude("https://example.com/.*");
            
            // Execute crawling
            String sessionId = crawler.execute();
            System.out.println("Crawling completed. Session ID: " + sessionId);
        }
    }
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

                logger.debug("Crawling access exception at url: {}", urlQueue.getUrl(), e);
            } else if (e.isInfoEnabled()) {
                logger.info(e.getMessage());
            } else if (e.isWarnEnabled()) {
                logger.warn("Crawling access exception at url: {}", urlQueue.getUrl(), e);
            } else if (e.isErrorEnabled()) {
                logger.error("Crawling access exception at url: {}", urlQueue.getUrl(), e);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 02:01:26 UTC 2025
    - 14K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/app/service/CrawlingInfoService.java

        }
    
        /**
         * Stores (inserts or updates) a crawling information record.
         * Sets up the store conditions including creation time if not already set,
         * then performs an insert or update operation with immediate refresh.
         *
         * @param crawlingInfo the crawling information entity to store
         * @throws FessSystemException if the crawling information is null
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 19.9K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java

     * Each enum constant represents a specific event or state in the crawler's execution.
     */
    public enum LogType {
        /** Indicates the start of a crawling process. */
        START_CRAWLING,
        /** Indicates the cleanup phase of crawling. */
        CLEANUP_CRAWLING,
        /** Indicates an unsupported URL was encountered when crawling started. */
        UNSUPPORTED_URL_AT_CRAWLING_STARTED,
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/ApiAdminCrawlinginfoAction.java

                    .status(ApiResult.Status.OK)
                    .result());
        }
    
        /**
         * Retrieves a specific crawling info log by ID.
         *
         * @param id the ID of the crawling info log to retrieve
         * @return JSON response containing the crawling info log data
         */
        // GET /api/admin/crawlinginfo/log/{id}
        @Execute
        public JsonResponse<ApiResult> get$log(final String id) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 6.1K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/helper/CrawlingInfoHelper.java

        }
    
        /**
         * Stores crawling information and parameters for the specified session.
         * Creates a new crawling info record if none exists or if create flag is true.
         * Also stores any accumulated information parameters and clears the info map.
         *
         * @param sessionId the session ID for the crawling information
         * @param create if true, creates a new crawling info regardless of existing records
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 15.2K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

    import org.codelibs.fess.crawler.service.UrlQueueService;
    
    import jakarta.annotation.Resource;
    
    /**
     * The Crawler class is the main class for web crawling. It manages the crawling process,
     * including adding URLs to the queue, filtering URLs, managing crawler threads,
     * and handling the overall crawling lifecycle.
     *
     * <p>It implements the Runnable interface to be executed in a separate thread,
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 17K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/helper/DataIndexHelper.java

    /**
     * Helper class for managing data crawling operations in Fess.
     * This class coordinates the execution of data store crawling processes,
     * managing multiple concurrent crawling threads and handling the indexing
     * of crawled documents into the search engine.
     *
     * <p>The DataIndexHelper supports:</p>
     * <ul>
     *   <li>Concurrent crawling of multiple data configurations</li>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 19K bytes
    - Viewed (0)
Back to top