Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 29 for crawlerContainer (0.48 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

        /** Header name for location redirects. */
        protected static final String LOCATION_HEADER = "Location";
    
        /** The crawler container for dependency injection. */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /** Map of parser features to configure the DOM parser. */
        protected Map<String, String> featureMap = new HashMap<>();
    
        /** Map of parser properties to configure the DOM parser. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

            // NOP
        }
    
        private static final Logger logger = LogManager.getLogger(UrlFilterImpl.class);
    
        /**
         * The crawler container.
         */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /**
         * The URL pattern.
         */
        protected String urlPattern = "^(.*:/+)([^/]*)(.*)$";
    
        /**
         * The include filtering pattern.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java

        /** Container for managing crawler components */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /** Map of keys to arrays of extractors */
        protected Map<String, Extractor[]> extractorMap = new HashMap<>();
    
        /**
         * Constructs a new ExtractorFactory.
         *
         * The constructor body contains no statements; the fields of this class
         * are populated by their own initializers or by injection.
         */
        public ExtractorFactory() {
            // Default constructor
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

        private static final Logger logger = LogManager.getLogger(CrawlerClientFactory.class);
    
        /**
         * The crawler container.
         */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /**
         * A map of regular expression patterns to crawler clients.
         */
        protected Map<Pattern, CrawlerClient> clientMap = new LinkedHashMap<>();
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7K bytes
    - Viewed (0)
  5. fess-crawler-lasta/src/main/java/org/codelibs/fess/crawler/container/LastaCrawlerContainer.java

    package org.codelibs.fess.crawler.container;
    
    import org.lastaflute.di.core.factory.SingletonLaContainerFactory;
    
    /**
     * LastaFlute implementation of {@link CrawlerContainer}.
     *
     * @author shinsuke
     *
     */
    public class LastaCrawlerContainer implements CrawlerContainer {
    
        /**
         * Creates a new instance of LastaCrawlerContainer.
         *
         * Construction immediately invokes {@code initialize()}, which is defined
         * outside this excerpt.
         *
         * NOTE(review): if {@code initialize()} can be overridden, a subclass
         * override would run before the subclass's own fields are initialized.
         * Confirm against the full class.
         */
        public LastaCrawlerContainer() {
            initialize();
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.4K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

        private DataService dataService;
    
        @Resource
        private UrlQueueService urlQueueService;
    
        @Resource
        private FileTransformer fileTransformer;
    
        @Resource
        private CrawlerContainer crawlerContainer;
    
        /**
         * Returns the fixed configuration file name for this test class.
         *
         * NOTE(review): presumably consumed by the base test class to set up the
         * container; the superclass is not visible here, so confirm there.
         *
         * @return the literal file name {@code "crawler.xml"}
         */
        @Override
        protected String prepareConfigFile() {
            return "crawler.xml";
        }
    
        public void test_execute_web() throws Exception {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

         */
        @Resource
        protected RuleManager ruleManager;
    
        /**
         * Container for managing crawler components.
         */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /**
         * Controller for managing crawling intervals and delays.
         */
        @Resource
        protected IntervalController intervalController;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

         */
        @Resource
        protected DataService<AccessResult<?>> dataService;
    
        /**
         * Container for managing crawler components.
         */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /**
         * Helper for logging crawler activities.
         */
        @Resource
        protected LogHelper logHelper;
    
        /**
         * Factory for creating crawler clients.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/AbstractCrawlerClient.java

        /** The property name for maximum cached content size. */
        public static final String MAX_CACHED_CONTENT_SIZE = "maxCachedContentSize";
    
        /** The crawler container. */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /** The initialization parameter map. */
        protected Map<String, Object> initParamMap;
    
        /** The maximum cached content size in bytes. Default is 1MB. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 9.7K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

        public boolean match(final ResponseData responseData) {
            if (super.match(responseData)) {
                try (final InputStream is = responseData.getResponseBody()) {
                    final SitemapsHelper sitemapsHelper = crawlerContainer.getComponent("sitemapsHelper");
                    return sitemapsHelper.isValid(is);
                } catch (final CrawlingAccessException e) {
                    throw e;
                } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
Back to top