- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 71 for sistema (0.04 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/Sitemap.java
import java.io.Serializable; /** * The Sitemap interface represents a sitemap entity with location and last modification date. * It extends the Serializable interface to allow sitemap objects to be serialized. */ public interface Sitemap extends Serializable { /** * Retrieves the location (URL) of the sitemap. * * @return the location of the sitemap as a String. */ String getLoc();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.2K bytes - Viewed (0) -
README.md
controller.setDefaultIntervalTime(1000); }); ``` ### Sitemap Support ```java // Enable sitemap processing container.singleton("sitemapsRule", SitemapsRule.class, rule -> { rule.addRule("url", ".*sitemap.*"); }); // Add sitemap URL crawler.addUrl("https://example.com/sitemap.xml"); ``` ## Data Access and Storage ### Accessing Crawled Data ```java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
final Set<RequestData> requestDataSet = new LinkedHashSet<>(); for (final Sitemap sitemap : sitemapSet.getSitemaps()) { if (sitemap != null) { requestDataSet.add(RequestDataBuilder.newRequestData().get().url(sitemap.getLoc()).build()); // TODO priority } }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java
sitemapList.add(sitemap); } /** * Removes a sitemap from this set. * @param sitemap the sitemap to remove */ public void removeSitemap(final Sitemap sitemap) { sitemapList.remove(sitemap); } /** * Gets all sitemaps in this set as an array. * @return an array of sitemaps */ public Sitemap[] getSitemaps() {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java
sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*")); assertTrue(sitemapsRule.match(responseData)); InputStream is = responseData.getResponseBody(); assertTrue(is instanceof InputStream); CloseableUtil.closeQuietly(responseData); } private void assertMatchFalse(ResponseData responseData) { sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*"));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 4.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java
String[] sitemaps = new String[] { "http://example.com/sitemap.xml", "http://test.com/sitemap.xml" }; crawlerContext.addSitemaps(sitemaps); // Remove and verify String[] removedSitemaps = crawlerContext.removeSitemaps(); assertNotNull(removedSitemaps); assertEquals(2, removedSitemaps.length); assertEquals("http://example.com/sitemap.xml", removedSitemaps[0]);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java
package org.codelibs.fess.crawler.entity; import org.codelibs.core.lang.StringUtil; /** * Represents a Sitemap file entry, conforming to the Sitemap XML format. * This class holds information about a single Sitemap, including its location and last modification timestamp. * It implements the {@link Sitemap} interface. * * <p> * A Sitemap file provides search engines with a list of URLs available for crawling.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.4K bytes - Viewed (1) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataServiceTest.java
accessResult1.setContentLength(Long.valueOf(10)); accessResult1.setCreateTime(System.currentTimeMillis()); accessResult1.setExecutionTime(10); accessResult1.setHttpStatusCode(200); accessResult1.setLastModified(System.currentTimeMillis()); accessResult1.setMethod("GET"); accessResult1.setMimeType("text/plain");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
final String sessionId = crawler.execute(); // Wait for crawler to start running with polling long startTime = System.currentTimeMillis(); while (crawler.crawlerContext.getStatus() != CrawlerStatus.RUNNING && System.currentTimeMillis() - startTime < 5000) { try { Thread.sleep(50); } catch (InterruptedException e) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
* * @param in Input stream for a sitemap * @return a sitemap set */ public SitemapSet parse(final InputStream in) { return parse(in, true); } /** * Parses a sitemap from the given input stream. * @param in the input stream to parse * @param recursive whether to recursively parse compressed files * @return the parsed sitemap set */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.7K bytes - Viewed (0)