Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 55 for sistema (0.08 sec)

  1. README.md

        controller.setDefaultIntervalTime(1000);
    });
    ```
    
    ### Sitemap Support
    
    ```java
    // Enable sitemap processing
    container.singleton("sitemapsRule", SitemapsRule.class, rule -> {
        rule.addRule("url", ".*sitemap.*");
    });
    
    // Add sitemap URL
    crawler.addUrl("https://example.com/sitemap.xml");
    ```
    
    ## Data Access and Storage
    
    ### Accessing Crawled Data
    
    ```java
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

                final Set<RequestData> requestDataSet = new LinkedHashSet<>();
                for (final Sitemap sitemap : sitemapSet.getSitemaps()) {
                    if (sitemap != null) {
                        requestDataSet.add(RequestDataBuilder.newRequestData().get().url(sitemap.getLoc()).build()); // TODO priority
                    }
                }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java

            sitemapList.add(sitemap);
        }
    
        /**
         * Removes a sitemap from this set.
         * @param sitemap the sitemap to remove
         */
        public void removeSitemap(final Sitemap sitemap) {
            sitemapList.remove(sitemap);
        }
    
        /**
         * Gets all sitemaps in this set as an array.
         * @return an array of sitemaps
         */
        public Sitemap[] getSitemaps() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.9K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            String[] sitemaps = new String[] { "http://example.com/sitemap.xml", "http://test.com/sitemap.xml" };
            crawlerContext.addSitemaps(sitemaps);
    
            // Remove and verify
            String[] removedSitemaps = crawlerContext.removeSitemaps();
            assertNotNull(removedSitemaps);
            assertEquals(2, removedSitemaps.length);
            assertEquals("http://example.com/sitemap.xml", removedSitemaps[0]);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

    package org.codelibs.fess.crawler.entity;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * Represents a Sitemap file entry, conforming to the Sitemap XML format.
     * This class holds information about a single Sitemap, including its location and last modification timestamp.
     * It implements the {@link Sitemap} interface.
     *
     * <p>
     * A Sitemap file provides search engines with a list of URLs available for crawling.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.4K bytes
    - Viewed (1)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                final String sessionId = crawler.execute();
    
                // Wait for crawler to start running with polling
                long startTime = System.currentTimeMillis();
                while (crawler.crawlerContext.getStatus() != CrawlerStatus.RUNNING && System.currentTimeMillis() - startTime < 5000) {
                    try {
                        Thread.sleep(50);
                    } catch (InterruptedException e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

         *
         * @param in Input stream for a sitemap
         * @return a sitemap set
         */
        public SitemapSet parse(final InputStream in) {
            return parse(in, true);
        }
    
        /**
         * Parses a sitemap from the given input stream.
         * @param in the input stream to parse
         * @param recursive whether to recursively parse compressed files
         * @return the parsed sitemap set
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

     * represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream.
     * The rule checks if the URL matches the defined regex pattern and then validates the content as a sitemap.
     * If any exception occurs during the sitemap validation, it logs the error and returns false.
     *
     */
    public class SitemapsRule extends RegexRule {
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/suggest/index/SuggestIndexer.java

                if (item == null) {
                    return new SuggestIndexResponse(0, 1, null, System.currentTimeMillis() - start);
                }
                final long parseTime = System.currentTimeMillis();
                final SuggestIndexResponse response = index(item);
                final long indexTime = System.currentTimeMillis();
                if (logger.isInfoEnabled()) {
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 34.8K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        }
    
        /**
         * Adds a sitemap URL to the list of sitemaps.
         *
         * @param url The URL of the sitemap to be added
         */
        public void addSitemap(final String url) {
            if (!sitemapList.contains(url)) {
                sitemapList.add(url);
            }
        }
    
        /**
         * Returns an array of sitemap URLs.
         *
         * @return an array of sitemap URLs
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
Back to top