Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 58 for Burles (0.1 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    import jakarta.annotation.Resource;
    
    /**
     * A response processor implementation that handles sitemaps.
     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

         */
        @Resource
        protected DataService<AccessResult<?>> dataService;
    
        /**
         * Filter for URLs to control which URLs are crawled.
         */
        @Resource
        protected UrlFilter urlFilter;
    
        /**
         * Manager for crawling rules and configurations.
         */
        @Resource
        protected RuleManager ruleManager;
    
        /**
         * Container for managing crawler components.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/Rule.java

    import java.io.Serializable;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    
    /**
     * The Rule interface defines the contract for implementing rules that can be applied to
     * response data in a web crawler. Implementations of this interface should provide logic
     * to determine if a given response data matches the rule, retrieve the rule's identifier,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java

     *   <li>{@code POST_PROCESSING} - Represents the post-processing state.</li>
     *   <li>{@code NO_URL_IN_QUEUE} - Indicates that there are no URLs in the queue.</li>
     *   <li>{@code WAIT_NEW_URL} - Indicates that the crawler is waiting for new URLs.</li>
     * </ul>
     */
    public interface IntervalController {
        /** Constant representing the pre-processing state. */
        int PRE_PROCESSING = 1;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java

    /**
     * {@link ChildUrlsException} is thrown when child URLs are found during crawling.
     * It extends {@link CrawlerSystemException} and holds a set of {@link RequestData}
     * representing the child URLs that caused the exception.
     *
     */
    public class ChildUrlsException extends CrawlerSystemException {
    
        private static final long serialVersionUID = 1L;
    
        /**
         * The list of child URLs.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImpl.java

    import org.codelibs.fess.crawler.rule.RuleManager;
    
    /**
     * Implementation of the {@link RuleManager} interface.
     * Manages a list of rules for the crawler.
     * Provides methods to add, remove, check, and retrieve rules.
     *
     */
    public class RuleManagerImpl implements RuleManager {
    
        /** The list of rules managed by this rule manager. */
        protected final List<Rule> ruleList = new ArrayList<>();
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/TransformerTest.java

            StatefulTransformer transformer = new StatefulTransformer("statefulTransformer");
    
            // Process multiple URLs
            String[] urls = { "http://example1.com", "http://example2.com", "http://example3.com" };
    
            for (String url : urls) {
                ResponseData responseData = new ResponseData();
                responseData.setUrl(url);
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 28K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java

            }
        }
    
        /**
         * Registers a client component with a regular expression.
         * The component will be loaded into all registered CrawlerClientFactories.
         * @param regex The regular expression to match URLs.
         * @param componentName The name of the component to register.
         */
        public synchronized void register(final String regex, final String componentName) {
            clientMap.put(regex, componentName);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlFilterService.java

         */
        void addIncludeUrlFilter(String sessionId, String url);
    
        /**
         * Adds a list of URLs to the include filter for a given session.
         *
         * @param sessionId the ID of the session for which the URLs should be included
         * @param urlList the list of URLs to be added to the include filter
         */
        void addIncludeUrlFilter(String sessionId, List<String> urlList);
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/AbstractRule.java

    import jakarta.annotation.Resource;
    
    /**
     * Abstract base class for implementing {@link Rule} interfaces.
     * Provides common functionality and properties for crawler rules.
     *
     * <p>
     * This class handles the registration of rules with the {@link RuleManager}
     * and provides getter and setter methods for common properties such as
     * {@code ruleId} and {@code responseProcessor}.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 2.8K bytes
    - Viewed (0)
Back to top