Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 55 for sitemaps (0.11 sec)

  1. fess-crawler/src/test/resources/sitemaps/sitemap1.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
       <url>
          <loc>http://www.example.com/</loc>
          <lastmod>2005-01-01</lastmod>
          <changefreq>monthly</changefreq>
          <priority>0.8</priority>
       </url>
       <url>
          <loc>http://www.example.com/catalog?item=12&amp;desc=vacation_hawaii</loc>
          <changefreq>weekly</changefreq>
       </url>
       <url>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 915 bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

         * Sitemap were changed. The value for the lastmod tag should be in W3C
         * Datetime format.
         *
         * By providing the last modification timestamp, you enable search engine
         * crawlers to retrieve only a subset of the Sitemaps in the index i.e. a
         * crawler may only retrieve Sitemaps that were modified since a certain
         * date. This incremental Sitemap fetching mechanism allows for the rapid
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 2.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

        }
    
        protected void addSitemapsFromRobotsTxt(final UrlQueue<?> urlQueue) {
            final String[] sitemaps = crawlerContext.removeSitemaps();
            if (sitemaps != null) {
                for (final String childUrl : sitemaps) {
                    try {
                        storeChildUrl(childUrl, urlQueue.getUrl(), null, urlQueue.getDepth() == null ? 1 : urlQueue.getDepth() + 1);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:41:37 UTC 2024
    - 15.5K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
        <include path="crawler/sitemaps.xml"/>
    
        <include path="crawler/opensearch.xml"/>
    
    	<!-- Crawler -->
    	<component name="crawler" class="org.codelibs.fess.crawler.Crawler" instance="prototype" >
    	</component>
    
    	<!-- Crawler Thread -->
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  5. fess-crawler-lasta/src/main/resources/crawler.xml

    	<include path="crawler/extractor.xml"/>
    	<include path="crawler/mimetype.xml"/>
    	<include path="crawler/encoding.xml"/>
    	<include path="crawler/urlconverter.xml"/>
    	<include path="crawler/log.xml"/>
    	<include path="crawler/sitemaps.xml"/>
    
    	<!-- Crawler -->
    	<component name="crawler" class="org.codelibs.fess.crawler.Crawler" instance="prototype" >
    	</component>
    
    	<!-- Crawler Thread -->
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Tue Nov 28 13:40:25 UTC 2017
    - 1.7K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                file.delete();
                file.mkdirs();
                file.deleteOnExit();
                fileTransformer.setPath(file.getAbsolutePath());
                crawler.addUrl(url + "sitemaps.xml");
                crawler.crawlerContext.setMaxAccessCount(maxCount);
                crawler.crawlerContext.setNumOfThread(numOfThread);
                crawler.urlFilter.addInclude(url + ".*");
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 11.9K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                file.delete();
                file.mkdirs();
                file.deleteOnExit();
                fileTransformer.setPath(file.getAbsolutePath());
                crawler.addUrl(url + "sitemaps.xml");
                crawler.crawlerContext.setMaxAccessCount(maxCount);
                crawler.crawlerContext.setNumOfThread(numOfThread);
                crawler.urlFilter.addInclude(url + ".*");
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 18K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                        if (robotsTxt != null) {
                            final String[] sitemaps = robotsTxt.getSitemaps();
                            if (sitemaps.length > 0) {
                                crawlerContext.addSitemaps(sitemaps);
                            }
    
                            final RobotsTxt.Directive directive = robotsTxt.getMatchedDirective(userAgent);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu May 09 09:29:26 UTC 2024
    - 41K bytes
    - Viewed (0)
  9. fess-crawler/src/test/resources/sitemaps/sitemap2.xml.gz

    sitemap2.xml http://www.example.com/sitemap1.xml.gz 2004-10-01T18:23:17+00:00 http://www.example.com/sitemap2.xml.gz 2005-01-01...
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 217 bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java

        public void removeSitemap(final Sitemap sitemap) {
            sitemapList.remove(sitemap);
        }
    
        public Sitemap[] getSitemaps() {
            return sitemapList.toArray(new Sitemap[sitemapList.size()]);
        }
    
        public void setType(final String type) {
            this.type = type;
        }
    
        public boolean isUrlSet() {
            return URLSET.equals(type);
        }
    
        public boolean isIndex() {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.7K bytes
    - Viewed (0)
Back to top