Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 5 of 5 for urlFilters (2.47 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

        /**
         * Provides the URL filter currently held by this object.
         * The stored reference is handed back directly, without copying.
         * @return The UrlFilter instance.
         */
        public UrlFilter getUrlFilter() {
            return this.urlFilter;
        }
    
        /**
         * Sets the URL filter.
         * The given instance is stored as-is; this method performs no
         * validation or copying of the argument.
         * @param urlFilter The UrlFilter instance to set.
         */
        public void setUrlFilter(final UrlFilter urlFilter) {
            // Qualify with "this" because the parameter shadows the field name.
            this.urlFilter = urlFilter;
        }
    
        /**
         * Returns the rule manager.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 17K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerThreadTest.java

            crawlerContainer = mock(CrawlerContainer.class);
            logHelper = mock(LogHelper.class);
            clientFactory = mock(CrawlerClientFactory.class);
            urlFilter = mock(UrlFilter.class);
            ruleManager = mock(RuleManager.class);
    
            crawlerContext.urlFilter = urlFilter;
            crawlerContext.ruleManager = ruleManager;
    
            crawlerThread.urlQueueService = urlQueueService;
            crawlerThread.dataService = dataService;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 18.3K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

                    try {
                        urlFilterService.delete(sid);
                    } catch (final Exception e) {
                        logger.warn("Failed to delete UrlFilter: sessionId={}", sid);
                    }
                }
    
                final DuplicateHostHelper duplicateHostHelper = ComponentUtil.getDuplicateHostHelper();
    
                // set urls
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 25K bytes
    - Viewed (0)
  4. CLAUDE.md

    ```
    
    3. **Add test with sample file** in `src/test/resources/`
    
    ### Configuring URL Filtering
    
    ```java
    // Include patterns (must match)
    crawler.urlFilter.addInclude("https://example.com/.*");
    
    // Exclude patterns (must not match)
    crawler.urlFilter.addExclude(".*\\.(css|js|png|jpg)$");
    ```
    
    ### Setting Crawl Limits
    
    ```java
    context.setMaxAccessCount(1000);  // Max URLs (0 = unlimited)
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/indexer/IndexUpdater.java

         */
        private void deleteBySessionId(final String sessionId) {
            try {
                urlFilterService.delete(sessionId);
            } catch (final Exception e) {
                logger.warn("Failed to delete UrlFilter: sessionId={}", sessionId, e);
            }
            try {
                urlQueueService.delete(sessionId);
            } catch (final Exception e) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 32.9K bytes
    - Viewed (0)
Back to top