Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 10 for addExclude (0.24 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            // Test empty pattern
            urlFilter.addInclude("");
            urlFilter.addExclude("");
    
            // Test single character pattern
            urlFilter.addInclude(".");
            urlFilter.addExclude("*");
    
            // Test patterns with only special characters
            urlFilter.addInclude("^$");
            urlFilter.addExclude(".*");
    
            // Should handle boundary conditions gracefully
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

         */
        protected UrlFilterService urlFilterService;
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.filter.UrlFilter#addExclude(java.lang.String)
         */
        @Override
        public void addExclude(final String urlPattern) {
            try {
                Pattern.compile(urlPattern);
            } catch (final Exception e) {
                if (logger.isWarnEnabled()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  3. README.md

    ```
    
    ### URL Filtering
    
    ```java
    // Include patterns
    crawler.urlFilter.addInclude("https://example.com/.*");
    crawler.urlFilter.addInclude(".*\\.pdf$");
    
    // Exclude patterns  
    crawler.urlFilter.addExclude(".*\\.js$");
    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    ### Protocols
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  4. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            crawler.crawlerContext.setMaxAccessCount(maxCount);
            crawler.crawlerContext.setNumOfThread(numOfThread);
            crawler.urlFilter.addInclude(url + ".*");
            crawler.urlFilter.addExclude(url + "/dir1/.*");
            final String sessionId = crawler.execute();
            assertEquals(maxCount, dataService.getCount(sessionId));
            dataService.delete(sessionId);
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

         */
        public void addExcludeFilter(final String regexp) {
            if (StringUtil.isNotBlank(regexp)) {
                urlFilter.addExclude(regexp);
            }
        }
    
        /**
         * Stops the crawling process.
         * Sets the crawler status to DONE and interrupts all crawler threads.
         */
        public void stop() {
            crawlerContext.setStatus(CrawlerStatus.DONE);
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            crawler.crawlerContext.setMaxAccessCount(maxCount);
            crawler.crawlerContext.setNumOfThread(numOfThread);
            crawler.urlFilter.addInclude(url + ".*");
            crawler.urlFilter.addExclude(url + "/dir1/.*");
            final String sessionId = crawler.execute();
            assertEquals(maxCount, dataService.getCount(sessionId));
            dataService.delete(sessionId);
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            @Override
            public void init(String sessionId) {
            }
    
            @Override
            public void addInclude(String urlPattern) {
            }
    
            @Override
            public void addExclude(String urlPattern) {
            }
    
            @Override
            public boolean match(String url) {
                return true;
            }
    
            @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                                            final String urlValue = hostUrl + urlPattern;
                                            crawlerContext.getUrlFilter().addExclude(urlValue);
                                            if (logger.isInfoEnabled()) {
                                                logger.info("Excluded URL: {}", urlValue);
                                            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
  9. compat/maven-compat/src/main/java/org/apache/maven/DefaultArtifactFilterManager.java

        public ArtifactFilter getArtifactFilter() {
            Set<String> excludes = new LinkedHashSet<>(getExcludedArtifacts());
    
            for (ArtifactFilterManagerDelegate delegate : delegates) {
                delegate.addExcludes(excludes);
            }
    
            return new ExclusionSetFilter(excludes);
        }
    
        /**
         * Returns the artifact filter for the standard core artifacts.
         *
    Registered: Sun Sep 07 03:35:12 UTC 2025
    - Last Modified: Fri Jun 06 14:28:57 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler.addUrl(url);
                crawler.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler.getCrawlerContext().setNumOfThread(numOfThread);
                crawler.urlFilter.addInclude(url + ".*");
                final String sessionId = crawler.execute();
                assertEquals(maxCount, dataService.getCount(sessionId));
                dataService.delete(sessionId);
            } finally {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
Back to top