Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 55 for rule (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/RuleManager.java

         */
        /**
         * Adds a rule to the specified index.
         *
         * @param index the position at which the rule should be added
         * @param rule the rule to be added
         */
        void addRule(int index, Rule rule);
    
        /**
         * Removes the specified rule from the rule manager.
         *
         * @param rule the rule to be removed
         * @return true if the rule was successfully removed, false otherwise
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

     */
    package org.codelibs.fess.crawler.rule.impl;
    
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.helper.SitemapsHelper;
    
    /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

         * Processes the response data using the appropriate rule processor.
         * @param urlQueue The URL queue entry.
         * @param responseData The response data to process.
         */
        protected void processResponse(final UrlQueue<?> urlQueue, final ResponseData responseData) {
            // get a rule
            final Rule rule = crawlerContext.ruleManager.getRule(responseData);
            if (rule == null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            @Override
            public Rule getRule(ResponseData responseData) {
                return null;
            }
    
            @Override
            public void addRule(Rule rule) {
            }
    
            @Override
            public void addRule(int index, Rule rule) {
            }
    
            @Override
            public boolean removeRule(Rule rule) {
                return false;
            }
    
            @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  5. src/test/java/org/codelibs/opensearch/extension/kuromoji/index/analysis/KuromojiTokenizerFactory.java

            nBestExamples = settings.get(NBEST_EXAMPLES);
        }
    
        private static String parse(String rule, Set<String> dup) {
            String[] values = CSVUtil.parse(rule);
            if (dup.add(values[0]) == false) {
                throw new IllegalArgumentException("Found duplicate term [" + values[0] + "] in user dictionary.");
            }
            return rule;
        }
    
        public static UserDictionary getUserDictionary(Environment env, Settings settings) {
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler.xml

    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml"/>
    	<include path="crawler/client.xml"/>
    	<include path="crawler/rule.xml"/>
    	<include path="crawler/filter.xml"/>
    	<include path="crawler/interval.xml"/>
    	<include path="crawler/extractor.xml"/>
    	<include path="crawler/mimetype.xml"/>
    	<include path="crawler/encoding.xml"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Tue Nov 28 13:40:25 UTC 2017
    - 1.7K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/AccessResult.java

         * @param sessionId the session identifier
         */
        void setSessionId(String sessionId);
    
        /**
         * Returns the rule identifier.
         *
         * @return the rule identifier
         */
        String getRuleId();
    
        /**
         * Sets the rule identifier.
         *
         * @param ruleId the rule identifier
         */
        void setRuleId(String ruleId);
    
        /**
         * Returns the URL of the accessed resource.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.2K bytes
    - Viewed (10)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/UrlConvertHelper.java

    /**
     * Helper class for converting URLs based on a set of predefined rules.
     *
     * <p>This class provides functionality to convert URLs by replacing parts of the URL
     * based on a map of target strings and their corresponding replacements. It allows
     * adding new conversion rules, setting the entire conversion map, and converting
     * URLs using these rules.</p>
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  9. README.md

        controller.setDefaultIntervalTime(1000);
    });
    ```
    
    ### Sitemap Support
    
    ```java
    // Enable sitemap processing
    container.singleton("sitemapsRule", SitemapsRule.class, rule -> {
        rule.addRule("url", ".*sitemap.*");
    });
    
    // Add sitemap URL
    crawler.addUrl("https://example.com/sitemap.xml");
    ```
    
    ## Data Access and Storage
    
    ### Accessing Crawled Data
    
    ```java
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                    .<SitemapsRule> singleton("sitemapsRule", SitemapsRule.class, rule -> {
                        rule.setResponseProcessor(container.getComponent("sitemapsResponseProcessor"));
                        rule.setRuleId("sitemapsRule");
                        rule.addRule("url", ".*sitemap.*");
                    })//
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
Back to top