Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 133 for Crawling (2.02 sec)

  1. src/main/java/org/codelibs/fess/ingest/Ingester.java

            return ComponentUtil.getIngestFactory();
        }
    
        /**
         * Processes a result data object for web/file crawling.
         * Default implementation returns the target unchanged.
         *
         * @param target the result data to process
         * @param responseData the response data from crawling
         * @return the processed result data
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.1K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/job/PurgeLogJob.java

            final StringBuilder resultBuf = new StringBuilder();
    
            // purge crawling sessions
            try {
                crawlingInfoService.deleteBefore(systemHelper.getCurrentTimeAsLong());
            } catch (final Exception e) {
                logger.error("Failed to purge crawling sessions.", e);
                resultBuf.append(e.getMessage()).append("\n");
            }
    
            // purge search logs
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java

            }
    
            if (cae.isDebugEnabled()) {
                logger.debug("[{}] Crawling Access Exception at {}", failureUrlId, urlQueue.getUrl(), cae);
            } else if (cae.isInfoEnabled()) {
                logger.info("[{}] {}", failureUrlId, cae.getMessage());
            } else if (cae.isWarnEnabled()) {
                logger.warn("[{}] Crawling Access Exception at {}", failureUrlId, urlQueue.getUrl(), cae);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 8.2K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/AdminCrawlinginfoAction.java

    import org.lastaflute.web.response.HtmlResponse;
    import org.lastaflute.web.response.render.RenderData;
    import org.lastaflute.web.ruts.process.ActionRuntime;
    
    import jakarta.annotation.Resource;
    
    /**
     * Admin action for Crawling Info management.
     *
     */
    public class AdminCrawlinginfoAction extends FessAdminAction {
    
        /**
         * Default constructor.
         */
        public AdminCrawlinginfoAction() {
            super();
        }
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

            }
        }
    
        /**
         * Processes a crawling request for a specific URL.
         * Executes the full crawling pipeline including client execution, rule processing,
         * transformation, and data extraction.
         *
         * @param crawlingConfig the crawling configuration to use
         * @param crawlingInfoId the crawling session ID
         * @param url the URL to process
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 17.2K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/crawler/interval/FessIntervalController.java

    import org.codelibs.fess.util.ComponentUtil;
    
    /**
     * FessIntervalController extends DefaultIntervalController to provide
     * Fess-specific interval control functionality for web crawling operations.
     * This controller manages delays and timing for various crawling states
     * including processing delays, queue waiting times, and new URL discovery.
     */
    public class FessIntervalController extends DefaultIntervalController {
    
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/admin/general/MailForm.java

        /**
         * Default constructor.
         */
        public MailForm() {
            // Default constructor
        }
    
        /** The incremental crawling setting. */
        public String incrementalCrawling;
    
        /** The day for cleanup setting. */
        public String dayForCleanup;
    
        /** The crawling thread count setting. */
        public String crawlingThreadCount;
    
        /** The search log setting. */
        public String searchLog;
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

     * This class extends the base CrawlerThread and provides Fess-specific functionality for
     * crawling and indexing documents, including incremental crawling capabilities, content
     * modification checking, and integration with the Fess search engine backend.
     *
     * <p>Key features include:</p>
     * <ul>
     * <li>Incremental crawling support with last-modified timestamp checking</li>
     * <li>Document expiration handling</li>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  9. src/test/java/org/codelibs/fess/job/PurgeLogJobTest.java

            ComponentUtil.register(systemHelper, "systemHelper");
            ComponentUtil.setFessConfig(fessConfig);
    
            // Execute
            String result = purgeLogJob.execute();
    
            // Assert crawling info and status update were called
            assertTrue(deleteCrawlingInfoCalled[0]);
            assertTrue(updateJobLogStatusCalled[0]);
    
            // Assert other services were not called
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Tue Aug 19 14:09:36 UTC 2025
    - 32.5K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/EditBody.java

    import org.codelibs.fess.app.web.admin.crawlinginfo.EditForm;
    
    /**
     * Request body class for crawling info edit operations in the admin REST API.
     * This class extends EditForm to inherit the necessary form validation and binding capabilities
     * for crawling information management operations.
     */
    public class EditBody extends EditForm {
    
        /**
         * Default constructor.
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.1K bytes
    - Viewed (0)
Back to top