Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 8 of 8 for addInclude (0.1 sec)

  1. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            crawler.crawlerContext.setMaxAccessCount(maxCount);
            crawler.crawlerContext.setNumOfThread(numOfThread);
            crawler.urlFilter.addInclude(url + ".*");
            crawler.urlFilter.addExclude(url + "/dir1/.*");
            final String sessionId = crawler.execute();
            assertEquals(maxCount, dataService.getCount(sessionId));
            dataService.delete(sessionId);
        }
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 11.9K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImplTest.java

            assertFalse(urlFilter.match("http://test.com/a"));
    
        }
    
        public void test_match_include_case2() {
            urlFilter.addInclude("http://example.com/.*");
            urlFilter.addInclude("http://test.com/.*");
    
            final String sessionId = "id1";
            urlFilter.init(sessionId);
    
            assertTrue(urlFilter.match("http://example.com/"));
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 6.9K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

            }
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.filter.UrlFilter#addInclude(java.lang.String)
         */
        @Override
        public void addInclude(final String urlPattern) {
            try {
                Pattern.compile(urlPattern);
            } catch (final Exception e) {
                if (logger.isWarnEnabled()) {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 7.3K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            crawler.crawlerContext.setMaxAccessCount(maxCount);
            crawler.crawlerContext.setNumOfThread(numOfThread);
            crawler.urlFilter.addInclude(url + ".*");
            crawler.urlFilter.addExclude(url + "/dir1/.*");
            final String sessionId = crawler.execute();
            assertEquals(maxCount, dataService.getCount(sessionId));
            dataService.delete(sessionId);
        }
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 18K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/UrlFilter.java

         * Add a URL pattern as a target.
         *
         * @param urlPattern Regular expression that is crawled
         */
        void addInclude(String urlPattern);
    
        /**
         * Adds a URL pattern as a non-target, i.e. a pattern for URLs that are not crawled.
         *
         * @param urlPattern regular expression describing the URLs that are not crawled
         */
        void addExclude(String urlPattern);
    
        /**
         * Process a URL when it is added as a seed URL.
         *
         * @param url URL
         */
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.6K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

        }
    
        /**
         * Forwards an include pattern to the URL filter.
         * Nothing is registered when {@code StringUtil.isNotBlank(regexp)} is false.
         *
         * @param regexp pattern handed to {@code urlFilter.addInclude}
         */
        public void addIncludeFilter(final String regexp) {
            // Guard clause: skip patterns that fail the not-blank check.
            if (!StringUtil.isNotBlank(regexp)) {
                return;
            }
            urlFilter.addInclude(regexp);
        }
    
        /**
         * Forwards an exclude pattern to the URL filter.
         * Nothing is registered when {@code StringUtil.isNotBlank(regexp)} is false.
         *
         * @param regexp pattern handed to {@code urlFilter.addExclude}
         */
        public void addExcludeFilter(final String regexp) {
            // Guard clause: skip patterns that fail the not-blank check.
            if (!StringUtil.isNotBlank(regexp)) {
                return;
            }
            urlFilter.addExclude(regexp);
        }
    
        public void stop() {
            crawlerContext.setStatus(CrawlerStatus.DONE);
            try {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 7.9K bytes
    - Viewed (0)
  7. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler.addUrl(url);
                crawler.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler.getCrawlerContext().setNumOfThread(numOfThread);
                crawler.urlFilter.addInclude(url + ".*");
                final String sessionId = crawler.execute();
                assertEquals(maxCount, dataService.getCount(sessionId));
                dataService.delete(sessionId);
            } finally {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 7.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                                            final String urlValue = hostUrl + urlPattern;
                                            crawlerContext.getUrlFilter().addInclude(urlValue);
                                            if (logger.isInfoEnabled()) {
                                                logger.info("Included URL: {}", urlValue);
                                            }
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu May 09 09:29:26 UTC 2024
    - 41K bytes
    - Viewed (0)
Back to top