Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 587 for crawling (0.75 sec)

  1. src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/SearchForm.java

     */
    package org.codelibs.fess.app.web.admin.crawlinginfo;
    
    /**
     * The search form for Crawling Info.
     */
    public class SearchForm {
    
        /**
         * Default constructor for SearchForm.
         */
        public SearchForm() {
        }
    
        /**
         * The session ID field for searching crawling information.
         */
        public String sessionId;
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 952 bytes
    - Viewed (0)
  2. CLAUDE.md

    - Graceful degradation (e.g., robots.txt parsing continues on errors)
    
    ---
    
    ## Key Components
    
    ### Crawler (`Crawler.java`)
    
    Main orchestrator for crawling operations.
    
    **Key Methods**:
    ```java
    String execute()                // Start crawling, return session ID
    void addUrl(String url)         // Add URL to queue
    void cleanup(String sessionId)  // Clean up session
    void stop()                     // Stop gracefully
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/app/web/admin/wizard/CrawlingConfigForm.java

    /**
     * Form class for crawling configuration wizard in the admin interface.
     * Contains validation constraints for creating new crawling configurations.
     */
    public class CrawlingConfigForm {
    
        /**
         * Creates a new form instance.
         */
        public CrawlingConfigForm() {
            // Default constructor
        }
    
        /**
         * Name of the crawling configuration.
         */
        @Required
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/Constants.java

        /** Property key for incremental crawling configuration. */
        public static final String INCREMENTAL_CRAWLING_PROPERTY = "crawling.incremental";
    
        /** Property key for crawling thread count configuration. */
        public static final String CRAWLING_THREAD_COUNT_PROPERTY = "crawling.thread.count";
    
        /** Property key for crawling user agent configuration. */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 35.2K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/app/web/admin/failureurl/EditForm.java

        /**
         * The name of the web configuration associated with this failure URL.
         * Used to identify which web crawling configuration encountered the failure.
         */
        public String webConfigName;
    
        /**
         * The name of the file configuration associated with this failure URL.
         * Used to identify which file crawling configuration encountered the failure.
         */
        public String fileConfigName;
    
        /**
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/app/web/admin/wizard/StartCrawlingForm.java

     */
    package org.codelibs.fess.app.web.admin.wizard;
    
    /**
     * Form class for starting crawling operations in the admin wizard.
     *
     * This form is used to collect user input and parameters needed to initiate
     * crawling operations through the administrative interface wizard workflow.
     * It serves as a data transfer object between the web layer and the crawling
     * service components.
     */
    public class StartCrawlingForm {
    
        /**
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  7. src/main/resources/fess_label.properties

    labels.createdTime=Created Time
    labels.depth=Depth
    labels.excludedPaths=Excluded Paths for Crawling
    labels.excludedUrls=Excluded URLs for Crawling
    labels.excludedDocPaths=Excluded Paths for Searching
    labels.excludedDocUrls=Excluded URLs for Searching
    labels.hostname=Hostname
    labels.id=ID
    labels.includedPaths=Included Paths for Crawling
    labels.includedUrls=Included URLs for Crawling
    labels.includedDocPaths=Included Paths for Searching
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 44K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/crawler/service/FessUrlQueueService.java

        }
    
        /**
         * Fetches URL queue list for the specified session with configurable ordering strategy.
         * Supports sequential (default) and random ordering based on crawling configuration.
         *
         * @param sessionId the crawling session identifier
         * @return list of URL queue entries for processing
         */
        @Override
        protected List<OpenSearchUrlQueue> fetchUrlQueueList(final String sessionId) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalController.java

                }
            }
        }
    
        /**
         * Delays the crawling process before processing a URL.
         */
        protected abstract void delayBeforeProcessing();
    
        /**
         * Delays the crawling process after processing a URL.
         */
        protected abstract void delayAfterProcessing();
    
        /**
         * Delays the crawling process when there are no URLs in the queue.
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:58:39 UTC 2025
    - 4.8K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/app/pager/CrawlingInfoPager.java

        private int currentPageNumber;
    
        /**
         * Crawling information ID.
         */
        public String id;
    
        /**
         * Session ID for the crawling session.
         */
        public String sessionId;
    
        /**
         * Creation time of the crawling information.
         */
        public String createdTime;
    
        /**
         * Clears all pagination state and crawling information fields.
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 6.9K bytes
    - Viewed (0)
Back to top