Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 34 for Crawling (0.06 sec)

  1. src/main/java/org/codelibs/fess/helper/CrawlingInfoHelper.java

        }
    
        /**
         * Stores crawling information and parameters for the specified session.
         * Creates a new crawling info record if none exists or if create flag is true.
         * Also stores any accumulated information parameters and clears the info map.
         *
         * @param sessionId the session ID for the crawling information
         * @param create if true, creates a new crawling info regardless of existing records
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 15.2K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/exec/Crawler.java

     * <ul>
     * <li>Web crawling - crawls web sites and web content</li>
     * <li>File system crawling - crawls file systems and documents</li>
     * <li>Data store crawling - crawls databases and other data sources</li>
     * <li>Combined crawling - runs multiple crawling types simultaneously</li>
     * </ul>
     *
     * <p>Command line usage:
     * <pre>
     * java org.codelibs.fess.exec.Crawler [options...]
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 31K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/helper/DataIndexHelper.java

    /**
     * Helper class for managing data crawling operations in Fess.
     * This class coordinates the execution of data store crawling processes,
     * managing multiple concurrent crawling threads and handling the indexing
     * of crawled documents into the search engine.
     *
     * <p>The DataIndexHelper supports:</p>
     * <ul>
     *   <li>Concurrent crawling of multiple data configurations</li>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 18.9K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/ApiAdminCrawlinginfoAction.java

                    .status(ApiResult.Status.OK)
                    .result());
        }
    
        /**
         * Retrieves a specific crawling info log by ID.
         *
         * @param id the ID of the crawling info log to retrieve
         * @return JSON response containing the crawling info log data
         */
        // GET /api/admin/crawlinginfo/log/{id}
        @Execute
        public JsonResponse<ApiResult> get$log(final String id) {
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 6.1K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/util/GsaConfigParser.java

    /**
     * Parser for Google Search Appliance (GSA) configuration files.
     * This SAX-based parser reads GSA XML configuration files and converts them into
     * Fess configuration objects including web crawling configurations, file crawling
     * configurations, and label types for access control.
     *
     * <p>The parser handles the following GSA configuration elements:
     * <ul>
     * <li>Collections with good/bad URL patterns</li>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 21.5K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImpl.java

        }
    
        /**
         * Adds a document to the search index by crawling the specified URL and processing the content.
         * This method handles recursive crawling with depth and access count limits, follows redirects,
         * and processes child URLs discovered during crawling.
         *
         * @param paramMap the data store parameters containing crawling configuration
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 28.9K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/AdminCrawlinginfoAction.java

    import org.lastaflute.web.response.HtmlResponse;
    import org.lastaflute.web.response.render.RenderData;
    import org.lastaflute.web.ruts.process.ActionRuntime;
    
    import jakarta.annotation.Resource;
    
    /**
     * Admin action for Crawling Info management.
     *
     */
    public class AdminCrawlinginfoAction extends FessAdminAction {
    
        /**
         * Default constructor.
         */
        public AdminCrawlinginfoAction() {
            super();
        }
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

            }
        }
    
        /**
         * Processes a crawling request for a specific URL.
         * Executes the full crawling pipeline including client execution, rule processing,
         * transformation, and data extraction.
         *
         * @param crawlingConfig the crawling configuration to use
         * @param crawlingInfoId the crawling session ID
         * @param url the URL to process
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 17.2K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

     * This class extends the base CrawlerThread and provides Fess-specific functionality for
     * crawling and indexing documents, including incremental crawling capabilities, content
     * modification checking, and integration with the Fess search engine backend.
     *
     * <p>Key features include:</p>
     * <ul>
     * <li>Incremental crawling support with last-modified timestamp checking</li>
     * <li>Document expiration handling</li>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  10. src/test/java/org/codelibs/fess/job/PurgeLogJobTest.java

            ComponentUtil.register(systemHelper, "systemHelper");
            ComponentUtil.setFessConfig(fessConfig);
    
            // Execute
            String result = purgeLogJob.execute();
    
            // Assert crawling info and status update were called
            assertTrue(deleteCrawlingInfoCalled[0]);
            assertTrue(updateJobLogStatusCalled[0]);
    
            // Assert other services were not called
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Tue Aug 19 14:09:36 UTC 2025
    - 32.5K bytes
    - Viewed (0)
Back to top