- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 55 for sitemaps (0.07 sec)
-
fess-crawler/src/test/resources/sitemaps/sitemap1.xml
<?xml version="1.0" encoding="UTF-8"?> <urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"> <url> <loc>http://www.example.com/</loc> <lastmod>2005-01-01</lastmod> <changefreq>monthly</changefreq> <priority>0.8</priority> </url> <url> <loc>http://www.example.com/catalog?item=12&desc=vacation_hawaii</loc> <changefreq>weekly</changefreq> </url> <url>
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 915 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java
* Sitemap were changed. The value for the lastmod tag should be in W3C * Datetime format. * * By providing the last modification timestamp, you enable search engine * crawlers to retrieve only a subset of the Sitemaps in the index i.e. a * crawler may only retrieve Sitemaps that were modified since a certain * date. This incremental Sitemap fetching mechanism allows for the rapid
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 2.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java
} protected void addSitemapsFromRobotsTxt(final UrlQueue<?> urlQueue) { final String[] sitemaps = crawlerContext.removeSitemaps(); if (sitemaps != null) { for (final String childUrl : sitemaps) { try { storeChildUrl(childUrl, urlQueue.getUrl(), null, urlQueue.getDepth() == null ? 1 : urlQueue.getDepth() + 1);
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:41:37 UTC 2024 - 15.5K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml
<include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/> <include path="crawler/sitemaps.xml"/> <include path="crawler/opensearch.xml"/> <!-- Crawler --> <component name="crawler" class="org.codelibs.fess.crawler.Crawler" instance="prototype" > </component> <!-- Crawler Thread -->
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Nov 07 04:44:10 UTC 2024 - 2.2K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler.xml
<include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/> <include path="crawler/sitemaps.xml"/> <!-- Crawler --> <component name="crawler" class="org.codelibs.fess.crawler.Crawler" instance="prototype" > </component> <!-- Crawler Thread -->
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Tue Nov 28 13:40:25 UTC 2017 - 1.7K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
file.delete(); file.mkdirs(); file.deleteOnExit(); fileTransformer.setPath(file.getAbsolutePath()); crawler.addUrl(url + "sitemaps.xml"); crawler.crawlerContext.setMaxAccessCount(maxCount); crawler.crawlerContext.setNumOfThread(numOfThread); crawler.urlFilter.addInclude(url + ".*");
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 11.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
file.delete(); file.mkdirs(); file.deleteOnExit(); fileTransformer.setPath(file.getAbsolutePath()); crawler.addUrl(url + "sitemaps.xml"); crawler.crawlerContext.setMaxAccessCount(maxCount); crawler.crawlerContext.setNumOfThread(numOfThread); crawler.urlFilter.addInclude(url + ".*");
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 18K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java
if (robotsTxt != null) { final String[] sitemaps = robotsTxt.getSitemaps(); if (sitemaps.length > 0) { crawlerContext.addSitemaps(sitemaps); } final RobotsTxt.Directive directive = robotsTxt.getMatchedDirective(userAgent);
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu May 09 09:29:26 UTC 2024 - 41K bytes - Viewed (0) -
fess-crawler/src/test/resources/sitemaps/sitemap2.xml.gz
sitemap2.xml http://www.example.com/sitemap1.xml.gz 2004-10-01T18:23:17+00:00 http://www.example.com/sitemap2.xml.gz 2005-01-01...
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 217 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java
public void removeSitemap(final Sitemap sitemap) { sitemapList.remove(sitemap); } public Sitemap[] getSitemaps() { return sitemapList.toArray(new Sitemap[sitemapList.size()]); } public void setType(final String type) { this.type = type; } public boolean isUrlSet() { return URLSET.equals(type); } public boolean isIndex() {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1.7K bytes - Viewed (0)