Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 1 - 10 of 41 for Crawling (0.04 seconds)

The search processing time has exceeded the limit. The displayed results may be partial.

  1. src/main/java/org/codelibs/fess/helper/CrawlingInfoHelper.java

        }
    
        /**
         * Stores crawling information and parameters for the specified session.
         * Creates a new crawling info record if none exists or if create flag is true.
         * Also stores any accumulated information parameters and clears the info map.
         *
         * @param sessionId the session ID for the crawling information
         * @param create if true, creates a new crawling info regardless of existing records
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Aug 07 03:06:29 GMT 2025
    - 15.2K bytes
    - Click Count (0)
  2. src/main/java/org/codelibs/fess/exec/Crawler.java

     * <ul>
     * <li>Web crawling - crawls web sites and web content</li>
     * <li>File system crawling - crawls file systems and documents</li>
     * <li>Data store crawling - crawls databases and other data sources</li>
     * <li>Combined crawling - runs multiple crawling types simultaneously</li>
     * </ul>
     *
     * <p>Command line usage:
     * <pre>
     * java org.codelibs.fess.exec.Crawler [options...]
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Mar 26 02:24:08 GMT 2026
    - 32.4K bytes
    - Click Count (0)
  3. src/main/java/org/codelibs/fess/helper/CrawlingConfigHelper.java

    import com.google.common.cache.Cache;
    import com.google.common.cache.CacheBuilder;
    
    import jakarta.annotation.PostConstruct;
    
    /**
     * Helper class for managing crawling configurations.
     * Provides functionality to store, retrieve, and manage different types of crawling configurations
     * including web, file, and data configurations. Supports caching and session-based configuration management.
     */
    public class CrawlingConfigHelper {
    
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 19.5K bytes
    - Click Count (1)
  4. src/main/java/org/codelibs/fess/app/service/CrawlingInfoService.java

        }
    
        /**
         * Stores (inserts or updates) a crawling information record.
         * Sets up the store conditions including creation time if not already set,
         * then performs an insert or update operation with immediate refresh.
         *
         * @param crawlingInfo the crawling information entity to store
         * @throws FessSystemException if the crawling information is null
         */
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Jul 17 08:28:31 GMT 2025
    - 19.9K bytes
    - Click Count (0)
  5. src/main/java/org/codelibs/fess/helper/DataIndexHelper.java

    /**
     * Helper class for managing data crawling operations in Fess.
     * This class coordinates the execution of data store crawling processes,
     * managing multiple concurrent crawling threads and handling the indexing
     * of crawled documents into the search engine.
     *
     * <p>The DataIndexHelper supports:</p>
     * <ul>
     *   <li>Concurrent crawling of multiple data configurations</li>
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 19K bytes
    - Click Count (0)
  6. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

                if (logger.isInfoEnabled()) {
                    logger.info("No crawling target urls.");
                }
                return;
            }
    
            doCrawl(sessionId, webConfigList, fileConfigList);
        }
    
        /**
         * Performs the actual crawling operation for the provided configurations.
         *
         * @param sessionId The session ID for this crawling operation
         * @param webConfigList List of web configurations to crawl
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 25K bytes
    - Click Count (0)
  7. src/main/java/org/codelibs/fess/job/CrawlJob.java

        /**
         * The namespace identifier for the crawling session.
         * Used to organize and identify crawling activities in the system.
         * Defaults to the system crawling info name.
         */
        protected String namespace = Constants.CRAWLING_INFO_SYSTEM_NAME;
    
        /**
         * Array of web crawling configuration IDs to process.
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 19.6K bytes
    - Click Count (0)
  8. src/main/java/org/codelibs/fess/app/web/admin/wizard/AdminWizardAction.java

            return redirectWith(getClass(), moreUrl("crawlingConfigForm"));
        }
    
        /**
         * Creates a crawling configuration and proceeds to the start crawling form.
         *
         * @param form the form containing crawling configuration data
         * @return HTML response redirecting to the start crawling form
         */
        @Execute
        @Secured({ ROLE })
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sat Jan 10 02:14:37 GMT 2026
    - 16.4K bytes
    - Click Count (0)
  9. src/main/java/org/codelibs/fess/app/web/admin/general/EditForm.java

        @Size(max = 10)
        public String thumbnail;
    
        /**
         * Types of crawling failures to ignore during crawling operations.
         * Specified failure types will not be logged or counted as errors.
         */
        @Size(max = 1000)
        public String ignoreFailureType;
    
        /**
         * Threshold for failure count before stopping crawling of a URL.
         * Set to -1 to disable the threshold check.
         */
        @Required
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Mar 26 02:24:08 GMT 2026
    - 15.8K bytes
    - Click Count (0)
  10. src/main/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImpl.java

        }
    
        /**
         * Adds a document to the search index by crawling the specified URL and processing the content.
         * This method handles recursive crawling with depth and access count limits, follows redirects,
         * and processes child URLs discovered during crawling.
         *
         * @param paramMap the data store parameters containing crawling configuration
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 29.7K bytes
    - Click Count (3)
Back to Top