- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 25 for sitemaps (0.04 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java
final InputStream in = ResourceUtil.getResourceAsStream("sitemaps/sitemap1.xml"); final SitemapSet sitemapSet = sitemapsHelper.parse(in); final Sitemap[] sitemaps = sitemapSet.getSitemaps(); assertEquals(5, sitemaps.length); assertTrue(sitemapSet.isUrlSet()); assertFalse(sitemapSet.isIndex()); assertEquals("2005-01-01", sitemaps[0].getLastmod());
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 9.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java
responseData.setResponseBody(file, false); return responseData; } private ResponseData getTestData3_OK() { final ResponseData responseData = new ResponseData(); responseData.setUrl("http://example.com/sitemap.txt"); File file = ResourceUtil.getResourceAsFile("sitemaps/sitemap1.txt"); responseData.setResponseBody(file, false); return responseData; }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 4.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java
* @param sitemap the sitemap to add */ public void addSitemap(final Sitemap sitemap) { sitemapList.add(sitemap); } /** * Removes a sitemap from this set. * @param sitemap the sitemap to remove */ public void removeSitemap(final Sitemap sitemap) { sitemapList.remove(sitemap); } /** * Gets all sitemaps in this set as an array.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
* and adds them as child URLs to be crawled. * * <p> * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text. * It then iterates through the sitemaps in the SitemapSet, extracts the URL * from each sitemap, and creates a new {@link RequestData} object for each URL. * These RequestData objects are added to a set of child URLs, which are then
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
} /** * Adds sitemaps to the thread-local storage. * @param sitemaps An array of sitemap URLs. */ public void addSitemaps(final String[] sitemaps) { sitemapsLocal.set(sitemaps); } /** * Removes sitemaps from the thread-local storage and returns them. * @return An array of sitemap URLs, or null if none were present. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
/** * Helper class for parsing and validating sitemaps. * It supports XML sitemaps, XML sitemap indexes, and text sitemaps, * and can handle GZIP compressed sitemaps. * The class provides methods to check if an input stream is a valid sitemap, * and to parse an input stream into a {@link SitemapSet} object. * It uses SAX parser for XML sitemaps and XML sitemap indexes, * and handles potential exceptions during parsing.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImplTest.java
} public void test_getRule_sitemaps1() { final ResponseData responseData = new ResponseData(); responseData.setUrl("http://www.example.com/sitemap1.xml"); File file = ResourceUtil.getResourceAsFile("sitemaps/sitemap1.xml"); responseData.setResponseBody(file, false); final Rule rule = ruleManager.getRule(responseData); assertNotNull(rule);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.2K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java
* represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream. * The rule checks if the URL matches the defined regex pattern and then validates the content as a sitemap. * If any exception occurs during the sitemap validation, it logs the error and returns false. * */ public class SitemapsRule extends RegexRule { /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java
* and processing of Sitemap data. * </p> * * <p> * The {@code loc} attribute specifies the URL of the Sitemap, while the {@code lastmod} attribute * indicates the last time the Sitemap file was modified. The {@code lastmod} attribute is used by crawlers * to incrementally fetch sitemaps that have been updated since a certain date. * </p> * * <p>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.4K bytes - Viewed (1)