Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 7 of 7 for sitemapsRule (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

     *
     */
    public class SitemapsRule extends RegexRule {
        /**
         * Serial version UID for serialization.
         */
        private static final long serialVersionUID = 1L;
    
        private static final Logger logger = LogManager.getLogger(SitemapsRule.class);
    
        /**
         * Creates a new SitemapsRule instance.
         */
        public SitemapsRule() {
            super();
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java

        public SitemapsRule sitemapsRule;
    
        @Override
        protected void setUp() throws Exception {
            super.setUp();
            StandardCrawlerContainer container = new StandardCrawlerContainer().singleton("sitemapsHelper", SitemapsHelper.class)//
                    .singleton("sitemapsRule", SitemapsRule.class);
            sitemapsRule = container.getComponent("sitemapsRule");
        }
    
        public void test_match() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImplTest.java

                    .singleton("sitemapsRule", SitemapsRule.class)//
                    .singleton("fileRule", RegexRule.class)//
                    .singleton("ruleManager", RuleManagerImpl.class);
    
            ruleManager = container.getComponent("ruleManager");
    
            SitemapsRule sitemapsRule = container.getComponent("sitemapsRule");
            sitemapsRule.setRuleId("sitemapsRule");
            sitemapsRule.addRule("url", ".*sitemap.*");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                    .singleton("sitemapsResponseProcessor", SitemapsResponseProcessor.class)//
                    .<SitemapsRule> singleton("sitemapsRule", SitemapsRule.class, rule -> {
                        rule.setResponseProcessor(container.getComponent("sitemapsResponseProcessor"));
                        rule.setRuleId("sitemapsRule");
                        rule.addRule("url", ".*sitemap.*");
                    })//
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  5. README.md

        controller.setDelayMillisForWaitingNewUrl(5000);
        controller.setDefaultIntervalTime(1000);
    });
    ```
    
    ### Sitemap Support
    
    ```java
    // Enable sitemap processing
    container.singleton("sitemapsRule", SitemapsRule.class, rule -> {
        rule.addRule("url", ".*sitemap.*");
    });
    
    // Add sitemap URL
    crawler.addUrl("https://example.com/sitemap.xml");
    ```
    
    ## Data Access and Storage
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf.append("</url>").append('\n');
                buf.append("</urlset>").append('\n');
                File sitemapsFile = new File(tempDir, "sitemaps.xml");
                FileUtil.writeBytes(sitemapsFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
                robotTxtFile.deleteOnExit();
    
                // sitemaps.txt
                buf = new StringBuilder();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  7. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf.append("</url>").append('\n');
                buf.append("</urlset>").append('\n');
                File sitemapsFile = new File(tempDir, "sitemaps.xml");
                FileUtil.writeBytes(sitemapsFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
                robotTxtFile.deleteOnExit();
    
                // sitemaps.txt
                buf = new StringBuilder();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
Back to top