Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 21 for batters (0.03 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

        /**
         * Test adding invalid regex include pattern
         */
        public void test_addInclude_invalidRegex() {
            String sessionId = "test-session-004";
            urlFilter.init(sessionId);
    
            // Invalid regex pattern should be handled gracefully
            urlFilter.addInclude(".*[invalid");
            urlFilter.addInclude("https://valid.com/.*");
    
            // Valid pattern should still work
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

         * The user-agent pattern in the directive is converted to a regular expression pattern,
         * where '*' is replaced with '.*' for pattern matching, and stored case-insensitively.
         *
         * @param directive The directive to add to the robots.txt rules
         */
        public void addDirective(final Directive directive) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

         * @return the parsed charset name, or null if not found
         */
        protected String parseCharset(final String content) {
            final Pattern pattern = Pattern.compile("; *charset *= *([a-zA-Z0-9\\-_]+)", Pattern.CASE_INSENSITIVE);
            final Matcher matcher = pattern.matcher(content);
            if (matcher.find()) {
                return matcher.group(1);
            }
            return null;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  4. README.md

    crawler.crawlerContext.setDefaultIntervalTime(1000); // 1 second
    ```
    
    ### URL Filtering
    
    ```java
    // Include patterns
    crawler.urlFilter.addInclude("https://example.com/.*");
    crawler.urlFilter.addInclude(".*\\.pdf$");
    
    // Exclude patterns  
    crawler.urlFilter.addExclude(".*\\.js$");
    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java

        }
    
        /**
         * Extracts the token value from the content using the given pattern.
         * @param tokenPattern The regex pattern.
         * @param content The content to search.
         * @return The extracted token value.
         */
        protected String getTokenValue(final String tokenPattern, final String content) {
            final Matcher matcher = Pattern.compile(tokenPattern).matcher(content);
            if (matcher.find()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (1)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

        }
    
        /**
         * Gets the pattern for extracting charset from meta tags.
         *
         * @return the meta charset pattern
         */
        public Pattern getMetaCharsetPattern() {
            return metaCharsetPattern;
        }
    
        /**
         * Sets the pattern for extracting charset from meta tags.
         *
         * @param metaCharsetPattern the meta charset pattern to set
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/AbstractRuleTest.java

            ConditionalAbstractRule conditionalRule = new ConditionalAbstractRule();
            conditionalRule.crawlerContainer = container;
            conditionalRule.setRuleId("conditionalRule");
    
            // Set patterns
            conditionalRule.setUrlPattern("https?://.*\\.example\\.com/.*");
            conditionalRule.setMimeTypePattern("text/.*");
    
            // Test matching
            ResponseData responseData1 = new ResponseData();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 21.9K bytes
    - Viewed (0)
  8. README.md

    PopularWordsResponse popularWords = suggester.popularWords()
        .setSize(20)                    // top 20 words
        .setQuery("tech*")              // filter pattern
        .execute()
        .getResponse();
    
    popularWords.getItems().forEach(item -> {
        System.out.println("Popular: " + item.getText() + 
                          " (freq: " + item.getDocFreq() + ")");
    });
    ```
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sun Aug 31 03:31:14 UTC 2025
    - 12.1K bytes
    - Viewed (1)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

         */
        public XpathTransformer() {
            super();
        }
    
        private static final Logger logger = LogManager.getLogger(XpathTransformer.class);
    
        private static final Pattern SPACE_PATTERN = Pattern.compile("\\s+", Pattern.MULTILINE);
    
        /**
         * A map of field rules, where the key is the field name and the value is the XPath expression.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/suggest/settings/ArraySettings.java

    import java.time.ZonedDateTime;
    import java.time.format.DateTimeFormatter;
    import java.util.Arrays;
    import java.util.Base64;
    import java.util.HashMap;
    import java.util.Locale;
    import java.util.Map;
    import java.util.regex.Pattern;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.CoreLibConstants;
    import org.codelibs.core.lang.StringUtil;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 15.6K bytes
    - Viewed (0)
Back to top