- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 49 for Sitemap (0.09 sec)
-
fess-crawler/src/test/resources/sitemaps/sitemap1.xml
<?xml version="1.0" encoding="UTF-8"?> <urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"> <url> <loc>http://www.example.com/</loc> <lastmod>2005-01-01</lastmod> <changefreq>monthly</changefreq> <priority>0.8</priority> </url> <url> <loc>http://www.example.com/catalog?item=12&amp;desc=vacation_hawaii</loc> <changefreq>weekly</changefreq> </url> <url>
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 915 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
} return false; } /** * Generates SitemapSet instance. * * This method does not close the input stream. * * @param in Input stream for a sitemap * @return a sitemap set */ public SitemapSet parse(final InputStream in) { return parse(in, true); } protected SitemapSet parse(final InputStream in, final boolean recursive) {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:40:57 UTC 2024 - 11.8K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler/rule.xml
<component class="org.codelibs.fess.crawler.processor.impl.SitemapsResponseProcessor"> </component> </property> <postConstruct name="addRule"> <arg>"url"</arg> <arg>".*sitemap.*"</arg> </postConstruct> </component> <component name="fileRule" class="org.codelibs.fess.crawler.rule.impl.RegexRule"> <property name="ruleId">"fileRule"</property> <property name="defaultRule">true</property>
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 1.5K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 6.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java
} catch (final CrawlingAccessException e) { throw e; } catch (final Exception e) { if (logger.isDebugEnabled()) { logger.debug("Failed a sitemap check: {}", responseData, e); } } } return false; }
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java
*/ package org.codelibs.fess.crawler.entity; import org.codelibs.core.lang.StringUtil; /** * @author shinsuke * */ public class SitemapUrl implements Sitemap { private static final long serialVersionUID = 1L; /** * URL of the page. This URL must begin with the protocol (such as http) and
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 4.9K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 6.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java
protected static final Pattern CRAWL_DELAY_RECORD = Pattern.compile("^crawl-delay:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE); protected static final Pattern SITEMAP_RECORD = Pattern.compile("^sitemap:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE); protected boolean enabled = true; public RobotsTxt parse(final InputStream stream) { return parse(stream, Constants.UTF_8); }
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:40:57 UTC 2024 - 6.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
rule.setResponseProcessor(container.getComponent("sitemapsResponseProcessor")); rule.setRuleId("sitemapsRule"); rule.addRule("url", ".*sitemap.*"); })// .<DefaultResponseProcessor> singleton("defaultResponseProcessor", DefaultResponseProcessor.class, processor -> {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 18K bytes - Viewed (0) -
fess-crawler/src/test/resources/sitemaps/sitemap2.xml.gz
sitemap2.xml http://www.example.com/sitemap1.xml.gz 2004-10-01T18:23:17+00:00 http://www.example.com/sitemap2.xml.gz 2005-01-01...
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 217 bytes - Viewed (0)