- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 44 for Sitemaps (1.22 sec)
-
fess-crawler-lasta/src/main/resources/crawler/sitemaps.xml
Shinsuke Sugaya <******@****.***> 1444529815 +0900
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 365 bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java
responseData.setResponseBody(file, false); return responseData; } private ResponseData getTestData3_OK() { final ResponseData responseData = new ResponseData(); responseData.setUrl("http://example.com/sitemap.txt"); File file = ResourceUtil.getResourceAsFile("sitemaps/sitemap1.txt"); responseData.setResponseBody(file, false); return responseData; }
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 4.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java
assertNull(((SitemapUrl) sitemaps[0]).getPriority()); assertNull(sitemaps[1].getLastmod()); assertEquals("http://www.example.com/catalog?item=12&desc=vacation_hawaii", sitemaps[1].getLoc()); assertNull(((SitemapUrl) sitemaps[1]).getChangefreq()); assertNull(((SitemapUrl) sitemaps[1]).getPriority()); assertNull(sitemaps[2].getLastmod());
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 36.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
} /** * Adds sitemaps to the thread-local storage. * @param sitemaps An array of sitemap URLs. */ public void addSitemaps(final String[] sitemaps) { sitemapsLocal.set(sitemaps); } /** * Removes sitemaps from the thread-local storage and returns them. * @return An array of sitemap URLs, or null if none were present. */
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
* and adds them as child URLs to be crawled. * * <p> * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text. * It then iterates through the sitemaps in the SitemapSet, extracts the URL * from each sitemap, and creates a new {@link RequestData} object for each URL. * These RequestData objects are added to a set of child URLs, which are then
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/RobotsTxtTest.java
robotsTxt.addSitemap("https://example.com/sitemap.xml"); robotsTxt.addSitemap("https://example.com/sitemap2.xml"); String[] sitemaps = robotsTxt.getSitemaps(); assertEquals(2, sitemaps.length); assertEquals("https://example.com/sitemap.xml", sitemaps[0]); assertEquals("https://example.com/sitemap2.xml", sitemaps[1]); } public void test_addSitemapNoDuplicates() {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Nov 13 13:29:22 UTC 2025 - 14.4K bytes - Viewed (0) -
fess-crawler/src/test/resources/sitemaps/sitemap2.xml
<?xml version="1.0" encoding="UTF-8"?> <sitemapindex xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"> <sitemap> <loc>http://www.example.com/sitemap1.xml.gz</loc> <lastmod>2004-10-01T18:23:17+00:00</lastmod> </sitemap> <sitemap> <loc>http://www.example.com/sitemap2.xml.gz</loc> <lastmod>2005-01-01</lastmod> </sitemap>
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 376 bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImplTest.java
} public void test_getRule_sitemaps1() { final ResponseData responseData = new ResponseData(); responseData.setUrl("http://www.example.com/sitemap1.xml"); File file = ResourceUtil.getResourceAsFile("sitemaps/sitemap1.xml"); responseData.setResponseBody(file, false); final Rule rule = ruleManager.getRule(responseData); assertNotNull(rule);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapImage.java
* </p> * * @see <a href="https://developers.google.com/search/docs/crawling-indexing/sitemaps/image-sitemaps">Google Image Sitemaps</a> */ public class SitemapImage implements Serializable { private static final long serialVersionUID = 1L; /** * The URL of the image. * In some cases, the image URL may not be on the same domain as your main site. */ private String loc;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Nov 13 13:34:36 UTC 2025 - 3.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java
assertTrue(robotsTxt.allows("/priceinfo", "DollarBot")); // Test sitemaps String[] sitemaps = robotsTxt.getSitemaps(); assertEquals(1, sitemaps.length); assertEquals("http://www.example.com/sitemap.xml", sitemaps[0]); } public void testParse_malformed() { RobotsTxt robotsTxt;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 20.6K bytes - Viewed (0)