Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 50 of 167 for Crawling (0.14 sec)

  1. MIGRATION.md

    #### Migration Steps
    
    **Step 1: Set Up Fess Crawling**
    
    1. In Fess Admin, create a new Web crawling configuration
    2. Add your website URL as the starting point
    3. Configure crawl depth and URL patterns
    4. Start crawling
    
    **Step 2: Replace JavaScript Code**
    
    Replace existing GSS/CSE code:
    
    ```javascript
    <!-- Old GSS/CSE Code -->
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Nov 06 12:40:11 UTC 2025
    - 23.2K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/AdminCrawlinginfoAction.java

    import org.lastaflute.web.response.HtmlResponse;
    import org.lastaflute.web.response.render.RenderData;
    import org.lastaflute.web.ruts.process.ActionRuntime;
    
    import jakarta.annotation.Resource;
    
    /**
     * Admin action for Crawling Info management.
     *
     */
    public class AdminCrawlinginfoAction extends FessAdminAction {
    
        /**
         * Default constructor.
         */
        public AdminCrawlinginfoAction() {
            super();
        }
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Nov 20 13:56:35 UTC 2025
    - 11K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/indexer/IndexUpdater.java

        public void setSessionIdList(final List<String> sessionIdList) {
            // Keeps the caller's list reference as-is; no copy is made here.
            this.sessionIdList = sessionIdList;
        }
    
        /**
         * Sets the flag indicating whether crawling should be finished.
         * The given value is stored as-is in the {@code finishCrawling} field.
         *
         * @param finishCrawling {@code true} if crawling should be finished, {@code false} otherwise
         */
        public void setFinishCrawling(final boolean finishCrawling) {
            this.finishCrawling = finishCrawling;
        }
    
        /**
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 32.9K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/service/FailureUrlService.java

    import org.dbflute.optional.OptionalEntity;
    
    import jakarta.annotation.Resource;
    
    /**
     * Service class for managing failure URLs that occur during web crawling.
     * Provides functionality to store, retrieve, and manage failed crawling attempts
     * with their associated error information.
     */
    public class FailureUrlService {
    
        /** Logger instance for this class */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  5. src/main/resources/fess_label_de.properties

    labels.depth=Tiefe
    labels.excludedPaths=Ausgeschlossene Pfade für das Crawling
    labels.excludedUrls=Ausgeschlossene URLs für das Crawling
    labels.excludedDocPaths=Ausgeschlossene Pfade für die Suche
    labels.excludedDocUrls=Ausgeschlossene URLs für die Suche
    labels.hostname=Hostname
    labels.id=ID
    labels.includedPaths=Eingeschlossene Pfade für das Crawling
    labels.includedUrls=Eingeschlossene URLs für das Crawling
    labels.includedDocPaths=Eingeschlossene Pfade für die Suche
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 46.9K bytes
    - Viewed (1)
  6. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

            }
        }
    
        /**
         * Processes a crawling request for a specific URL.
         * Executes the full crawling pipeline including client execution, rule processing,
         * transformation, and data extraction.
         *
         * @param crawlingConfig the crawling configuration to use
         * @param crawlingInfoId the crawling session ID
         * @param url the URL to process
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 17.4K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RequestData.java

    import java.util.Objects;
    
    import org.codelibs.fess.crawler.Constants;
    
    /**
     * Represents a request data for crawling.
     * This class encapsulates the HTTP method, URL, and weight associated with a crawling request.
     */
    public class RequestData {
        /**
         * HTTP methods supported for crawling requests.
         */
        public enum Method {
            /** HTTP GET method. */
            GET,
            /** HTTP POST method. */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

     * This class extends the base CrawlerThread and provides Fess-specific functionality for
     * crawling and indexing documents, including incremental crawling capabilities, content
     * modification checking, and integration with the Fess search engine backend.
     *
     * <p>Key features include:</p>
     * <ul>
     * <li>Incremental crawling support with last-modified timestamp checking</li>
     * <li>Document expiration handling</li>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 19.5K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/EditBody.java

    import org.codelibs.fess.app.web.admin.crawlinginfo.EditForm;
    
    /**
     * Request body class for crawling info edit operations in the admin REST API.
     * This class extends EditForm to inherit the necessary form validation and binding capabilities
     * for crawling information management operations.
     */
    public class EditBody extends EditForm {
    
        /**
         * Default constructor.
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/ResponseProcessor.java

    /**
     * The ResponseProcessor interface defines a contract for processing response data.
     * Implementations of this interface are responsible for handling the response data
     * obtained during a crawling process.
     */
    public interface ResponseProcessor {
    
        /**
         * Processes the given response data.
         *
         * @param responseData the response data to be processed
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.1K bytes
    - Viewed (0)
Back to top