Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 1 - 10 of 101 for URLs (0.03 seconds)

  1. src/test/java/org/codelibs/fess/helper/NotificationHelperTest.java

            } catch (Exception e) {
                fail("sendToSlack() should not throw an exception with blank URLs: " + e.getMessage());
            }
        }
    
        @Test
        public void test_sendToSlack_withNullWebhookUrls() {
            // Setup mock configuration with null webhook URLs
            ComponentUtil.setFessConfig(new MockFessConfig() {
                @Override
                public String getSlackWebhookUrls() {
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Wed Jan 14 14:29:07 GMT 2026
    - 20K bytes
    - Click Count (0)
  2. src/main/java/org/codelibs/fess/opensearch/config/exentity/WebConfig.java

                if (StringUtil.isNotBlank(getIncludedDocUrls())) {
                    final List<Pattern> urlPatterList = new ArrayList<>();
                    final String[] urls = getIncludedDocUrls().split("[\r\n]");
                    for (final String u : urls) {
                        final String v = systemHelper.normalizeConfigPath(u);
                        if (StringUtil.isNotBlank(v)) {
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sat Jan 10 01:38:30 GMT 2026
    - 10.3K bytes
    - Click Count (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

    import org.codelibs.fess.crawler.service.UrlQueueService;
    
    import jakarta.annotation.Resource;
    
    /**
     * The Crawler class is the main class for web crawling. It manages the crawling process,
     * including adding URLs to the queue, filtering URLs, managing crawler threads,
     * and handling the overall crawling lifecycle.
     *
     * <p>It implements the Runnable interface to be executed in a separate thread,
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Mon Nov 24 03:59:47 GMT 2025
    - 17K bytes
    - Click Count (0)
  4. src/main/java/org/codelibs/fess/opensearch/config/bsentity/BsWebConfig.java

            this.updatedTime = value;
        }
    
        public String getUrls() {
            checkSpecifiedProperty("urls");
            return convertEmptyToNull(urls);
        }
    
        public void setUrls(String value) {
            registerModifiedProperty("urls");
            this.urls = value;
        }
    
        public String getUserAgent() {
            checkSpecifiedProperty("userAgent");
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sat Mar 15 06:53:53 GMT 2025
    - 14.1K bytes
    - Click Count (0)
  5. src/main/java/org/codelibs/fess/util/GsaConfigParser.java

        /** XML element name for start URLs configuration. */
        protected static final String START_URLS = "start_urls";
    
        /** XML element name for good (included) URLs configuration. */
        protected static final String GOOD_URLS = "good_urls";
    
        /** XML element name for bad (excluded) URLs configuration. */
        protected static final String BAD_URLS = "bad_urls";
    
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 21.6K bytes
    - Click Count (0)
  6. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

            }
        }
    
        /**
         * Extracts anchor URLs from the given object and converts them to RequestData objects.
         * The input object can be either a single string or a list of strings representing URLs.
         *
         * @param obj the object containing anchor URLs (String or List of Strings)
         * @return a set of RequestData objects for the anchor URLs, or null if no valid URLs found
         */
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Dec 11 09:47:03 GMT 2025
    - 19.5K bytes
    - Click Count (0)
  7. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

        }
    
        private static final Logger logger = LogManager.getLogger(WebFsIndexHelper.class);
    
        private static final String DISABLE_URL_ENCODE = "#DISABLE_URL_ENCODE";
    
        /**
         * Maximum number of URLs to access during crawling.
         */
        protected long maxAccessCount = Long.MAX_VALUE;
    
        /**
         * Interval time in milliseconds between crawling executions.
         */
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 25K bytes
    - Click Count (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

                logHelper.log(key, objs);
            }
        }
    
        /**
         * Runs the crawling process in a separate thread.
         * This method fetches URLs from the queue, accesses content, processes responses,
         * and extracts child URLs until the crawling process is done or no more URLs are available.
         */
        @Override
        public void run() {
            log(logHelper, LogType.START_THREAD, crawlerContext);
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Wed Dec 31 09:07:38 GMT 2025
    - 20.3K bytes
    - Click Count (0)
  9. src/test/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImplTest.java

            for (int i = 0; i < threadCount; i++) {
                assertNull(exceptions[i], "Thread " + i + " threw exception");
            }
    
            // Verify all URLs were added
            synchronized (mockCallback) {
                assertEquals("All URLs should be added", threadCount * urlsPerThread, callback.deleteUrlList.size());
            }
        }
    
        /**
         * Test concurrent reads from deleteUrlList while synchronized.
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Wed Jan 14 14:29:07 GMT 2026
    - 19.7K bytes
    - Click Count (0)
  10. src/main/java/org/codelibs/fess/helper/CrawlingConfigHelper.java

        }
    
        /**
         * Retrieves a list of URLs that should be excluded from crawling based on failure counts.
         * URLs are excluded if they have failed more than the configured failure count threshold.
         * URLs can also be filtered by failure type using a regular expression pattern.
         *
         * @param configId the configuration ID to get excluded URLs for
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 19.5K bytes
    - Click Count (1)
Back to Top