Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 50 of 86 for provided (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

    /**
     * {@link HtmlXpathExtractor} is an implementation of the {@link org.codelibs.fess.crawler.extractor.Extractor} interface.
     * It uses XPath expressions to extract text content from HTML documents.
     * <p>
     * This class provides methods to configure the XPath expressions, parser features, and properties.
     * It also includes a caching mechanism for XPathAPI instances to improve performance.
     * </p>
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java

    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ExtractData;
    
    /**
     * The Extractor interface defines methods for extracting text data from an input stream.
     * Implementations of this interface should provide the logic for extracting text and
     * optionally override the default weight value.
     */
    public interface Extractor {
    
        /**
         * Extracts text data from the given input stream.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java

    import org.codelibs.fess.crawler.service.UrlFilterService;
    
    import jakarta.annotation.Resource;
    
    /**
     * Implementation of the {@link UrlFilterService} interface.
     * This class provides methods for managing URL filtering rules,
     * including adding include and exclude URL patterns, deleting patterns,
     * and retrieving lists of compiled URL patterns. It utilizes a
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalController.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.interval.IntervalController;
    
    /**
     * An abstract base class for implementing {@link IntervalController}.
     * Provides a common structure for handling delays at different stages of the crawling process.
     * It encapsulates the delay logic and exception handling, allowing subclasses to focus on
     * defining the specific delay behavior for each stage.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/RobotsTxtException.java

     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * RobotsTxtException is an exception class that represents an error related to robots.txt processing during web crawling.
     * It extends CrawlerSystemException and provides constructors to create instances with a message and/or a cause.
     *
     */
    public class RobotsTxtException extends CrawlerSystemException {
    
        private static final long serialVersionUID = 1L;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

     * It also provides a method to retrieve the extracted data as a String from an AccessResultData object.
     *
     * <p>
     * The class handles character encoding issues by attempting to use the specified charset.
     * If the specified charset is invalid, it falls back to UTF-8.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/MultipleCrawlingAccessException.java

    /**
     * An exception that indicates multiple crawling access exceptions occurred.
     * This exception holds an array of Throwable objects representing the individual causes.
     * It extends CrawlingAccessException and provides methods to print the stack traces of all causes.
     *
     */
    public class MultipleCrawlingAccessException extends CrawlingAccessException {
    
        private static final long serialVersionUID = 1L;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.5K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/DataServiceImpl.java

    import org.codelibs.fess.crawler.util.AccessResultCallback;
    
    import jakarta.annotation.Resource;
    
    /**
     * Implementation of the {@link DataService} interface for managing access result data.
     * This class provides methods to store, retrieve, update, and delete access results,
     * as well as to iterate over them. It uses a {@link MemoryDataHelper} to store the data in memory.
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.8K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/SitemapsException.java

     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * Exception thrown during sitemaps processing in the crawler.
     * This exception extends {@link org.codelibs.fess.crawler.exception.CrawlerSystemException}
     * and provides constructors for wrapping other exceptions or creating a new exception with a message.
     */
    public class SitemapsException extends CrawlerSystemException {
        private static final long serialVersionUID = 1L;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/util/OpenSearchCrawlerConfig.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.util;
    
    /**
     * Configuration class for OpenSearch crawler settings.
     * This class provides configuration for index names, shards, and replicas
     * for the queue, data, and filter indices used by the crawler.
     */
    public class OpenSearchCrawlerConfig {
        /**
         * Constructs a new OpenSearchCrawlerConfig.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.4K bytes
    - Viewed (10)
Back to top