Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 71 for sistema (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/Sitemap.java

    import java.io.Serializable;
    
    /**
     * The Sitemap interface represents a sitemap entity with location and last modification date.
     * It extends the Serializable interface to allow sitemap objects to be serialized.
     */
    public interface Sitemap extends Serializable {
    
        /**
         * Retrieves the location (URL) of the sitemap.
         *
         * @return the location of the sitemap as a String.
         */
        String getLoc();
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  2. README.md

        controller.setDefaultIntervalTime(1000);
    });
    ```
    
    ### Sitemap Support
    
    ```java
    // Enable sitemap processing
    container.singleton("sitemapsRule", SitemapsRule.class, rule -> {
        rule.addRule("url", ".*sitemap.*");
    });
    
    // Add sitemap URL
    crawler.addUrl("https://example.com/sitemap.xml");
    ```
    
    ## Data Access and Storage
    
    ### Accessing Crawled Data
    
    ```java
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

                final Set<RequestData> requestDataSet = new LinkedHashSet<>();
                for (final Sitemap sitemap : sitemapSet.getSitemaps()) {
                    if (sitemap != null) {
                        requestDataSet.add(RequestDataBuilder.newRequestData().get().url(sitemap.getLoc()).build()); // TODO priority
                    }
                }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java

            sitemapList.add(sitemap);
        }
    
        /**
         * Removes a sitemap from this set.
         * <p>
         * Delegates to {@code sitemapList.remove(sitemap)}; whatever that call
         * returns is not propagated to the caller.
         *
         * @param sitemap the sitemap to remove
         */
        public void removeSitemap(final Sitemap sitemap) {
            sitemapList.remove(sitemap);
        }
    
        /**
         * Gets all sitemaps in this set as an array.
         * @return an array of sitemaps
         */
        public Sitemap[] getSitemaps() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.9K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java

            sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*"));
            assertTrue(sitemapsRule.match(responseData));
            InputStream is = responseData.getResponseBody();
            assertTrue(is instanceof InputStream);
            CloseableUtil.closeQuietly(responseData);
        }
    
        private void assertMatchFalse(ResponseData responseData) {
            sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            String[] sitemaps = new String[] { "http://example.com/sitemap.xml", "http://test.com/sitemap.xml" };
            crawlerContext.addSitemaps(sitemaps);
    
            // Remove and verify
            String[] removedSitemaps = crawlerContext.removeSitemaps();
            assertNotNull(removedSitemaps);
            assertEquals(2, removedSitemaps.length);
            assertEquals("http://example.com/sitemap.xml", removedSitemaps[0]);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

    package org.codelibs.fess.crawler.entity;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * Represents a Sitemap file entry, conforming to the Sitemap XML format.
     * This class holds information about a single Sitemap, including its location and last modification timestamp.
     * It implements the {@link Sitemap} interface.
     *
     * <p>
     * A Sitemap file provides search engines with a list of URLs available for crawling.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.4K bytes
    - Viewed (1)
  8. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataServiceTest.java

            accessResult1.setContentLength(Long.valueOf(10));
            accessResult1.setCreateTime(System.currentTimeMillis());
            accessResult1.setExecutionTime(10);
            accessResult1.setHttpStatusCode(200);
            accessResult1.setLastModified(System.currentTimeMillis());
            accessResult1.setMethod("GET");
            accessResult1.setMimeType("text/plain");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.8K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                final String sessionId = crawler.execute();
    
                // Wait for crawler to start running with polling
                long startTime = System.currentTimeMillis();
                while (crawler.crawlerContext.getStatus() != CrawlerStatus.RUNNING && System.currentTimeMillis() - startTime < 5000) {
                    try {
                        Thread.sleep(50);
                    } catch (InterruptedException e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

         *
         * @param in Input stream for a sitemap
         * @return a sitemap set
         */
        public SitemapSet parse(final InputStream in) {
            // Convenience entry point: hand off to the two-argument overload with its
            // boolean flag switched on (presumably the "recursive" option - confirm
            // against that overload's signature).
            final boolean flagEnabled = true;
            return parse(in, flagEnabled);
        }
    
        /**
         * Parses a sitemap from the given input stream.
         * @param in the input stream to parse
         * @param recursive whether to recursively parse compressed files
         * @return the parsed sitemap set
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
Back to top