Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 22 for defined (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

     * represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream.
     * The rule checks if the URL matches the defined regex pattern and then validates the content as a sitemap.
     * If any exception occurs during the sitemap validation, it logs the error and returns false.
     *
     */
    public class SitemapsRule extends RegexRule {
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/AbstractRule.java

     * and provides getter and setter methods for common properties such as
     * {@code ruleId} and {@code responseProcessor}.
     * </p>
     *
     * <p>
     * Subclasses should extend this class and implement the abstract methods
     * defined in the {@link Rule} interface to provide specific rule logic.
     * </p>
     *
     */
    public abstract class AbstractRule implements Rule {
    
        private static final long serialVersionUID = 1L;
    
        /** The rule ID. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/suggest/settings/AnalyzerSettings.java

     *   <li>Loading index settings and mappings from resources.</li>
     *   <li>Checking the availability of analyzers for supported languages.</li>
     * </ul>
     *
     * <p>Supported languages are defined in the SUPPORTED_LANGUAGES array.</p>
     *
     * <p>Inner class:</p>
     * <ul>
     *   <li>DefaultContentsAnalyzer: Implements the SuggestAnalyzer interface to analyze text and retrieve tokens using
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 26.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

     * The class supports caching of include and exclude patterns for scenarios where a session ID is not available.
     * It also provides methods to initialize the filter with a session ID, clear the filter,
     * match a URL against the defined patterns, and process a URL to add include or exclude patterns based on predefined filtering patterns.
     *
     */
    /**
     * This class is an implementation of a URL filter.
     */
    public class UrlFilterImpl implements UrlFilter {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/Constants.java

     * Constants used in the fess-crawler.
     * This class provides a collection of constant values for HTTP methods, status codes,
     * transformer names, boolean values, character encodings, date/time formats, and XML features.
     * This class is not meant to be instantiated.
     */
    public final class Constants {
        /**
         * The GET method.
         */
        public static final String GET_METHOD = "GET";
    
        /**
         * The HEAD method.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.6K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

    import org.xml.sax.InputSource;
    
    /**
     * {@link XpathTransformer} is a class that transforms HTML content into XML format based on XPath expressions.
     * It extracts data from an HTML document by applying XPath rules defined in {@link #fieldRuleMap}.
     * The extracted data is then formatted into an XML structure and stored in the {@link ResultData}.
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

     */
    package org.codelibs.fess.crawler.entity;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * Represents a URL entry within a sitemap.
     *
     * <p>
     * This class encapsulates the properties of a URL as defined in the sitemap XML format,
     * including its location, last modification date, change frequency, and priority.
     * It implements the {@link Sitemap} interface.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

    import java.util.List;
    import java.util.Map;
    import java.util.regex.Pattern;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * Represents a robots.txt file parser and handler.
     * This class manages the rules defined in a robots.txt file, including user agent directives,
     * allowed/disallowed paths, crawl delays, and sitemap URLs.
     *
     * <p>The robots.txt protocol is implemented according to the standard specification,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/ResponseProcessor.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.processor;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    
    /**
     * The ResponseProcessor interface defines a contract for processing response data.
     * Implementations of this interface are responsible for handling the response data
     * obtained during a crawling process.
     */
    public interface ResponseProcessor {
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.interval;
    
    /**
     * The {@code IntervalController} interface defines methods for controlling
     * the delay intervals in a web crawler. It includes constants representing
     * different types of processing states and a method to introduce a delay
     * based on the type of processing.
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
Back to top