Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 22 for Filter (0.09 sec)

  1. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/entity/OpenSearchUrlFilter.java

            this.sessionId = sessionId;
        }
    
        /**
         * Returns the filter type.
         * @return The filter type.
         */
        public String getFilterType() {
            return filterType;
        }
    
        /**
         * Sets the filter type.
         * @param filterType The filter type.
         */
        public void setFilterType(final String filterType) {
            this.filterType = filterType;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.6K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/util/OpenSearchCrawlerConfig.java

            this.dataIndex = dataIndex;
        }
    
        /**
         * Returns the filter index name.
         * @return The filter index name.
         */
        public String getFilterIndex() {
            return filterIndex;
        }
    
        /**
         * Sets the filter index name.
         * @param filterIndex The filter index name.
         */
        public void setFilterIndex(final String filterIndex) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.4K bytes
    - Viewed (10)
  3. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

        /**
         * Field name for filter type.
         */
        private static final String FILTER_TYPE = "filterType";
    
        /**
         * Filter type for include filters.
         */
        private static final String INCLUDE = "include";
    
        /**
         * Filter type for exclude filters.
         */
        private static final String EXCLUDE = "exclude";
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

     * <ol>
     *   <li>Initialization: Sets up the crawler context and initializes the URL filter.</li>
     *   <li>Thread Creation: Creates a group of crawler threads to perform the actual crawling.</li>
     *   <li>Execution: Starts the crawler threads and waits for them to complete.</li>
     *   <li>Cleanup: Deletes the crawled data and clears the URL filter.</li>
     * </ol>
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

     * It also provides methods to initialize the filter with a session ID, clear the filter,
     * match a URL against the defined patterns, and process a URL to add include or exclude patterns based on predefined filtering patterns.
     *
     */
    /**
     * This class is an implementation of a URL filter.
     */
    public class UrlFilterImpl implements UrlFilter {
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

        public void setStatus(final CrawlerStatus status) {
            this.status = status;
        }
    
        /**
         * Returns the URL filter.
         * @return The UrlFilter.
         */
        public UrlFilter getUrlFilter() {
            return urlFilter;
        }
    
        /**
         * Sets the URL filter.
         * @param urlFilter The UrlFilter.
         */
        public void setUrlFilter(final UrlFilter urlFilter) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.filter;
    
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.filter.impl.UrlFilterImpl;
    import org.codelibs.fess.crawler.helper.MemoryDataHelper;
    import org.codelibs.fess.crawler.service.impl.DataServiceImpl;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  8. README.md

        client.setConnectionTimeout(30000);
        client.setMaxConnections(100);
    });
    
    // Configure URL filtering
    container.singleton("urlFilter", UrlFilterImpl.class, filter -> {
        filter.addInclude("https://example.com/.*");
        filter.addExclude(".*\\.(css|js|png|jpg|gif)$");
    });
    
    // Configure content extraction
    container.singleton("tikaExtractor", TikaExtractor.class);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.filter.UrlFilter;
    import org.codelibs.fess.crawler.filter.impl.UrlFilterImpl;
    import org.codelibs.fess.crawler.helper.MemoryDataHelper;
    import org.codelibs.fess.crawler.helper.RobotsTxtHelper;
    import org.codelibs.fess.crawler.helper.impl.MimeTypeHelperImpl;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

            SearchResponse response = getClient().get(c -> c.prepareSearch(index)
                    .setScroll(new TimeValue(scrollTimeout))
                    .setQuery(QueryBuilders.boolQuery().filter(QueryBuilders.termQuery(SESSION_ID, oldSessionId)))
                    .setSize(scrollSize)
                    .execute());
            String scrollId = response.getScrollId();
            try {
                while (scrollId != null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17K bytes
    - Viewed (1)
Back to top