Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 65 for urlset (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java

    /**
     * {@link ChildUrlsException} is thrown when child URLs are found during crawling.
     * It extends {@link CrawlerSystemException} and holds a set of {@link RequestData}
     * representing the child URLs that caused the exception.
     *
     */
    public class ChildUrlsException extends CrawlerSystemException {
    
        private static final long serialVersionUID = 1L;
    
        /**
         * The set of child URLs.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java

     *   <li>{@code POST_PROCESSING} - Represents the post-processing state.</li>
     *   <li>{@code NO_URL_IN_QUEUE} - Indicates that there are no URLs in the queue.</li>
     *   <li>{@code WAIT_NEW_URL} - Indicates that the crawler is waiting for new URLs.</li>
     * </ul>
     */
    public interface IntervalController {
        /** Constant representing the pre-processing state. */
        int PRE_PROCESSING = 1;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java

            }
        }
    
        /**
         * Registers a client component with a regular expression.
         * The component will be loaded into all registered CrawlerClientFactories.
         * @param regex The regular expression to match URLs.
         * @param componentName The name of the component to register.
         */
        public synchronized void register(final String regex, final String componentName) {
            clientMap.put(regex, componentName);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlFilterService.java

         */
        void addIncludeUrlFilter(String sessionId, String url);
    
        /**
         * Adds a list of URLs to the include filter for a given session.
         * This is the list-based overload of
         * {@link #addIncludeUrlFilter(String, String)}.
         *
         * @param sessionId the ID of the session for which the URLs should be included
         * @param urlList the list of URLs to be added to the include filter
         */
        void addIncludeUrlFilter(String sessionId, List<String> urlList);
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

                                InputStream in = null;
                                try {
                                    if (isByteStream) {
                                        inputStream.reset();
                                        in = inputStream;
                                    } else {
                                        in = new FileInputStream(tempFile);
                                    }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

        }
    
        /**
         * Gets the robots.txt URL set currently held in the
         * {@code robotsTxtUrlSet} field. The field reference is returned
         * directly; no copy is made.
         *
         * @return the set of robots.txt URLs
         */
        public Set<String> getRobotsTxtUrlSet() {
            return this.robotsTxtUrlSet;
        }
    
        /**
         * Sets the set of robots.txt URLs.
         * @param robotsTxtUrlSet The set of robots.txt URLs.
         */
        public void setRobotsTxtUrlSet(final Set<String> robotsTxtUrlSet) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResultData.java

        protected String transformerName;
    
        /** The data of the result. */
        protected byte[] data;
    
        /** The encoding of the result. */
        protected String encoding;
    
        /** The set of the child URLs. */
        protected Set<RequestData> childUrlSet = new LinkedHashSet<>();
    
        /** The raw data. */
        protected Object rawData = null;
    
        /** The serializer. */
        protected Function<Object, byte[]> serializer;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/AbstractTransformerTest.java

            assertEquals("http://example.com/test", transformer.getLastResponseData().getUrl());
    
            // Reset and verify
            transformer.reset();
            assertEquals(0, transformer.getTransformCallCount());
            assertNull(transformer.getLastResponseData());
    
            // Name should persist after reset
            assertEquals("workflowTransformer", transformer.getName());
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 20.8K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java

        REDIRECT_LOCATION,
        /** Indicates processing a response. */
        PROCESS_RESPONSE,
        /** Indicates the crawling process has finished. */
        FINISHED_CRAWLING,
        /** Indicates processing child URLs due to an exception. */
        PROCESS_CHILD_URLS_BY_EXCEPTION,
        /** Indicates processing a child URL due to an exception. */
        PROCESS_CHILD_URL_BY_EXCEPTION,
        /** Indicates an access exception during crawling. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * influence the position of your URLs in a search engine's result pages.
         * Search engines may use this information when selecting between URLs on
         * the same site, so you can use this tag to increase the likelihood that
         * your most important pages are present in a search index.
         *
         * Also, please note that assigning a high priority to all of the URLs on
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
Back to top