- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 12 for Sitemap (0.11 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java
} /** * Adds a sitemap URL to the list of sitemaps. * * @param url The URL of the sitemap to be added */ public void addSitemap(final String url) { if (!sitemapList.contains(url)) { sitemapList.add(url); } } /** * Returns an array of sitemap URLs. * * @return an array of sitemap URLs */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java
} /** * Test sitemaps add and remove operations */ public void test_sitemaps() { // Initial state assertNull(crawlerContext.removeSitemaps()); // Add sitemaps String[] sitemaps = new String[] { "http://example.com/sitemap.xml", "http://test.com/sitemap.xml" }; crawlerContext.addSitemaps(sitemaps); // Remove and verify
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
/** * Helper class for parsing and validating sitemaps. * It supports XML sitemaps, XML sitemap indexes, and text sitemaps, * and can handle GZIP compressed sitemaps. * The class provides methods to check if an input stream is a valid sitemap, * and to parse an input stream into a {@link SitemapSet} object. * It uses SAX parser for XML sitemaps and XML sitemap indexes, * and handles potential exceptions during parsing.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.7K bytes - Viewed (0) -
README.md
controller.setDefaultIntervalTime(1000); }); ``` ### Sitemap Support ```java // Enable sitemap processing container.singleton("sitemapsRule", SitemapsRule.class, rule -> { rule.addRule("url", ".*sitemap.*"); }); // Add sitemap URL crawler.addUrl("https://example.com/sitemap.xml"); ``` ## Data Access and Storage ### Accessing Crawled Data ```java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
rule.setResponseProcessor(container.getComponent("sitemapsResponseProcessor")); rule.setRuleId("sitemapsRule"); rule.addRule("url", ".*sitemap.*"); })// .<DefaultResponseProcessor> singleton("defaultResponseProcessor", DefaultResponseProcessor.class, processor -> {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java
} /** * Adds sitemaps from robots.txt to the crawling queue. * @param urlQueue The URL queue to add sitemaps to. */ protected void addSitemapsFromRobotsTxt(final UrlQueue<?> urlQueue) { final String[] sitemaps = crawlerContext.removeSitemaps(); if (sitemaps != null) { for (final String childUrl : sitemaps) { try {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 20.4K bytes - Viewed (0) -
src/main/java/jcifs/smb1/http/NetworkExplorer.java
* Default constructor. */ public NetworkExplorer() { super(); } private static LogStream log = LogStream.getInstance(); /** The MIME type mapping */ private MimeMap mimeMap; /** The CSS style for HTML rendering */ private String style; /** The NTLM SSP handler */ private NtlmSsp ntlmSsp; /** Flag indicating if credentials were supplied */
Registered: Sun Sep 07 00:10:21 UTC 2025 - Last Modified: Sun Aug 31 08:00:57 UTC 2025 - 22.6K bytes - Viewed (0) -
docs/debugging/xl-meta/main.go
if i > 1 { file = fmt.Sprintf("%s/part.%d", file, i) filemap[file] = make(map[string]string) filemap[file][verID] = fmt.Sprintf("%s/part.%d/shard-%02d-of-%02d", verID, i, idx, ei.V2Obj.EcN+ei.V2Obj.EcM) filemap[file][verID+".json"] = buf.String() } partDataToVerID[dataFile] = [2]string{file, verID} }
Registered: Sun Sep 07 19:28:11 UTC 2025 - Last Modified: Fri Aug 29 02:39:48 UTC 2025 - 40.3K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
file.delete(); file.mkdirs(); file.deleteOnExit(); fileTransformer.setPath(file.getAbsolutePath()); crawler.addUrl(url + "sitemaps.xml"); crawler.crawlerContext.setMaxAccessCount(maxCount); crawler.crawlerContext.setNumOfThread(numOfThread); crawler.urlFilter.addInclude(url + ".*");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 12.8K bytes - Viewed (0) -
android/guava/src/com/google/common/collect/HashBiMap.java
*/ @GwtIncompatible @J2ktIncompatible private void writeObject(ObjectOutputStream stream) throws IOException { stream.defaultWriteObject(); Serialization.writeMap(this, stream); } @GwtIncompatible @J2ktIncompatible private void readObject(ObjectInputStream stream) throws IOException, ClassNotFoundException { stream.defaultReadObject();
Registered: Fri Sep 05 12:43:10 UTC 2025 - Last Modified: Mon Aug 11 19:31:30 UTC 2025 - 36.2K bytes - Viewed (0)