Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 9 of 9 for fighters (0.04 sec)

  1. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

        private static final String FILTER_TYPE = "filterType";
    
        /**
         * Filter type for include filters.
         */
        private static final String INCLUDE = "include";
    
        /**
         * Filter type for exclude filters.
         */
        private static final String EXCLUDE = "exclude";
    
        /**
         * Cache for include filters.
         */
        protected LoadingCache<String, List<Pattern>> includeFilterCache;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlFilterService.java

     */
    package org.codelibs.fess.crawler.service;
    
    import java.util.List;
    import java.util.regex.Pattern;
    
    /**
     * Service interface for managing URL filters.
     * Provides methods to add and remove include/exclude URL filters,
     * as well as retrieve the patterns of these filters.
     */
    public interface UrlFilterService {
    
        /**
         * Adds a URL to the include filter list for the specified session.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/entity/OpenSearchUrlFilter.java

    import java.io.IOException;
    
    import org.opensearch.core.xcontent.ToXContent;
    import org.opensearch.core.xcontent.XContentBuilder;
    
    /**
     * OpenSearchUrlFilter is an entity for URL filters in OpenSearch.
     */
    public class OpenSearchUrlFilter implements ToXContent {
    
        /**
         * Creates a new instance of OpenSearchUrlFilter.
         */
        public OpenSearchUrlFilter() {
            // NOP
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.6K bytes
    - Viewed (0)
  4. README.md

    - **StorageClient**: Cloud storage integration
    
    #### Content Processing Pipeline
    - **Extractors**: Content extraction from various formats
    - **Transformers**: Data transformation and enrichment
    - **Filters**: URL filtering with regex patterns
    - **Rules**: Content processing rules and validation
    
    ## Building and Testing
    
    ### Build Commands
    
    ```bash
    # Build all modules
    mvn clean install
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            assertFalse(urlFilter.match("https://other.com/page"));
    
            // Clear the filter
            urlFilter.clear();
    
            // After clear, all URLs should match (no filters applied)
            assertTrue(urlFilter.match("https://example.com/page"));
            assertTrue(urlFilter.match("https://other.com/page"));
            assertTrue(urlFilter.match("https://any.com/image.jpg"));
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

     *   <li>Extracting text from metadata if the main content extraction fails</li>
     *   <li>Reading content as plain text if all other methods fail</li>
     *   <li>Applying post-extraction filters</li>
     *   <li>Handling Tika exceptions, including zip bomb exceptions</li>
     * </ul>
     *
     * <p>
     * The class also supports configuration options such as:
     * </p>
     * <ul>
     *   <li>Output encoding</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

     *   <li>Cleanup: Deletes the crawled data and clears the URL filter.</li>
     * </ol>
     *
     * <p>The crawler can be configured with various parameters, such as the number of threads,
     * the maximum depth of crawling, and URL filters.
     *
     * <p>Example usage:
     * <pre>
     *   Crawler crawler = new Crawler();
     *   crawler.addUrl("http://example.com/");
     *   crawler.execute();
     *   crawler.close();
     * </pre>
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  8. fess-crawler/src/test/resources/ajax/js/jquery-2.1.1.min.js

    this.each(function(c){n(this).wrapAll(b?a.call(this,c):a)})},unwrap:function(){return this.parent().each(function(){n.nodeName(this,"body")||n(this).replaceWith(this.childNodes)}).end()}}),n.expr.filters.hidden=function(a){return a.offsetWidth<=0&&a.offsetHeight<=0},n.expr.filters.visible=function(a){return!n.expr.filters.hidden(a)};var wc=/%20/g,xc=/\[\]$/,yc=/\r?\n/g,zc=/^(?:submit|button|image|reset|file)$/i,Ac=/^(?:input|select|textarea|keygen)/i;function Bc(a,b,c,d){var e;if(n.isArray(b))n.each(b,fun...
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 82.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      </mime-type>
    
      <mime-type type="application/x-tika-msworks-spreadsheet">
        <glob pattern="*.xlr"/>
        <sub-class-of type="application/vnd.ms-excel"/>
        <!-- this has to be higher than the Excel match -->
        <magic priority="60">
          <match value="0xd0cf11e0a1b11ae1" type="string" offset="0:8">
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (2)
Back to top