Search Options

Results per page
Sort
Preferred Languages
Advance

Results 61 - 70 of 524 for crawling (0.04 sec)

  1. README.md

    You can register crawling targets in the Admin UI on the (Web, File, Data Store) crawler configuration pages, and then start the Crawler manually on the [Scheduler page](https://fess.codelibs.org/15.0/admin/scheduler-guide.html).
    
    ## Migration from another search provider
    
    Please see [MIGRATION.md](MIGRATION.md).
    
    ## Data Store
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 10 06:34:32 UTC 2025
    - 7.2K bytes
    - Viewed (2)
  2. src/test/java/org/codelibs/fess/job/PurgeLogJobTest.java

            ComponentUtil.register(systemHelper, "systemHelper");
            ComponentUtil.setFessConfig(fessConfig);
    
            // Execute
            String result = purgeLogJob.execute();
    
            // Assert crawling info and status update were called
            assertTrue(deleteCrawlingInfoCalled[0]);
            assertTrue(updateJobLogStatusCalled[0]);
    
            // Assert other services were not called
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Tue Aug 19 14:09:36 UTC 2025
    - 32.5K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/app/web/admin/reqheader/EditForm.java

     * including tracking information for optimistic locking and audit trails.
     * Request headers are used to customize HTTP requests sent during web crawling operations.
     *
     */
    public class EditForm extends CreateForm {
    
        /**
         * Creates a new EditForm instance.
         */
        public EditForm() {
            super();
        }
    
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/service/WebConfigService.java

    import org.dbflute.optional.OptionalEntity;
    
    import jakarta.annotation.Resource;
    
    /**
     * Service class for managing web crawling configurations.
     * Provides CRUD operations for web configuration settings including
     * listing, retrieving, storing, and deleting web crawling configurations.
     */
    public class WebConfigService extends FessAppService {
    
        /**
         * Default constructor.
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 6.6K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/app/service/RequestHeaderService.java

    import org.dbflute.optional.OptionalEntity;
    
    import jakarta.annotation.Resource;
    
    /**
     * Service class for managing request headers used in web crawling configurations.
     * This service provides CRUD operations for request headers that are applied
     * during web crawling to configure HTTP request behavior.
     *
     */
    public class RequestHeaderService {
    
        /**
         * Behavior for request header database operations.
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.2K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/app/web/admin/duplicatehost/CreateForm.java

    import jakarta.validation.constraints.Size;
    
    /**
     * Form class for creating new duplicate host configuration entries.
     * This form handles the creation of duplicate host mappings that redirect
     * crawling from duplicate hostnames to the regular canonical hostname.
     */
    public class CreateForm {
    
        /**
         * Creates a new CreateForm instance.
         */
        public CreateForm() {
        }
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.5K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/admin/duplicatehost/EditForm.java

     * including tracking information for optimistic locking and audit trails.
     * Duplicate hosts are used to define which domains should be treated as the same site for crawling purposes.
     *
     */
    public class EditForm extends CreateForm {
    
        /**
         * Creates a new EditForm instance.
         */
        public EditForm() {
            super();
        }
    
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  8. src/main/resources/fess_config.properties

    crawler.document.fullstop.chars=u002eu06d4u2e3cu3002
    # Encoding for crawling data.
    crawler.crawling.data.encoding=UTF-8
    # Supported web protocols for crawling.
    crawler.web.protocols=http,https
    # Supported file protocols for crawling.
    crawler.file.protocols=file,smb,smb1,ftp,storage
    # Pattern for environment variable keys in crawling data.
    crawler.data.env.param.key.pattern=^FESS_ENV_.*
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jul 05 14:45:37 UTC 2025
    - 54.7K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/app/web/admin/scheduler/CreateForm.java

        /**
         * The script data or code for the scheduled job.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String scriptData;
    
        /**
         * Whether this job is related to crawling.
         */
        public String crawler;
    
        /**
         * Whether job logging is enabled.
         */
        public String jobLogging;
    
        /**
         * Whether the scheduled job is available/enabled.
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.2K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java

     * This processor extends DefaultResponseProcessor to provide additional
     * processing capabilities through the ingest framework, allowing for
     * custom data transformation and enrichment during the crawling process.
     *
     * <p>It supports pluggable ingesters that can modify the result data
     * before it is stored in the search index.</p>
     */
    public class FessResponseProcessor extends DefaultResponseProcessor {
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.7K bytes
    - Viewed (0)
Back to top