Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 50 of 524 for crawling (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

    import org.codelibs.fess.crawler.service.DataService;
    import org.codelibs.fess.crawler.service.UrlQueueService;
    
    /**
     * Utility class for managing crawling parameters using ThreadLocal variables.
     * This class provides methods to set and get various parameters related to the crawling process.
     *
     * <p>This class is final and cannot be instantiated.</p>
     *
     * <p>The following parameters are managed:</p>
     * <ul>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/AdminCrawlinginfoAction.java

    import org.lastaflute.web.response.HtmlResponse;
    import org.lastaflute.web.response.render.RenderData;
    import org.lastaflute.web.ruts.process.ActionRuntime;
    
    import jakarta.annotation.Resource;
    
    /**
     * Admin action for Crawling Info management.
     *
     */
    public class AdminCrawlinginfoAction extends FessAdminAction {
    
        /**
         * Default constructor.
         */
        public AdminCrawlinginfoAction() {
            super();
        }
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

            }
        }
    
        /**
         * Processes a crawling request for a specific URL.
         * Executes the full crawling pipeline including client execution, rule processing,
         * transformation, and data extraction.
         *
         * @param crawlingConfig the crawling configuration to use
         * @param crawlingInfoId the crawling session ID
         * @param url the URL to process
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 17.2K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/util/GsaConfigParser.java

    /**
     * Parser for Google Search Appliance (GSA) configuration files.
     * This SAX-based parser reads GSA XML configuration files and converts them into
     * Fess configuration objects including web crawling configurations, file crawling
     * configurations, and label types for access control.
     *
     * <p>The parser handles the following GSA configuration elements:
     * <ul>
     * <li>Collections with good/bad URL patterns</li>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 21.5K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

     * This class extends the base CrawlerThread and provides Fess-specific functionality for
     * crawling and indexing documents, including incremental crawling capabilities, content
     * modification checking, and integration with the Fess search engine backend.
     *
     * <p>Key features include:</p>
     * <ul>
     * <li>Incremental crawling support with last-modified timestamp checking</li>
     * <li>Document expiration handling</li>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/app/service/FailureUrlService.java

    import org.dbflute.optional.OptionalEntity;
    
    import jakarta.annotation.Resource;
    
    /**
     * Service class for managing failure URLs that occur during web crawling.
     * Provides functionality to store, retrieve, and manage failed crawling attempts
     * with their associated error information.
     */
    public class FailureUrlService {
    
        /** Logger instance for this class */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RequestData.java

    import java.util.Objects;
    
    import org.codelibs.fess.crawler.Constants;
    
    /**
     * Represents a request data for crawling.
     * This class encapsulates the HTTP method, URL, and weight associated with a crawling request.
     */
    public class RequestData {
        /**
         * HTTP methods supported for crawling requests.
         */
        public enum Method {
            /** HTTP GET method. */
            GET,
            /** HTTP POST method. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/EditBody.java

    import org.codelibs.fess.app.web.admin.crawlinginfo.EditForm;
    
    /**
     * Request body class for crawling info edit operations in the admin REST API.
     * This class extends EditForm to inherit the necessary form validation and binding capabilities
     * for crawling information management operations.
     */
    public class EditBody extends EditForm {
    
        /**
         * Default constructor.
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/app/pager/FileConfigPager.java

        /** Configuration name */
        public String name;
    
        /** File system paths to crawl */
        public String paths;
    
        /** Number of threads for crawling */
        public String numOfThread;
    
        /** Interval time between crawling operations */
        public String intervalTime;
    
        /** Boost value for search ranking */
        public String boost;
    
        /** Availability status of the configuration */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

                putResultDataBody(dataMap, fessConfig.getIndexFieldContent(), content);
            }
        }
    
        /**
         * Retrieves the crawling configuration for the given response data.
         *
         * @param responseData the response data from crawling
         * @return the crawling configuration
         */
        protected CrawlingConfig getCrawlingConfig(final ResponseData responseData) {
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 54.4K bytes
    - Viewed (0)
Back to top