- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 21 for batters (0.03 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java
/** * Test adding invalid regex include pattern */ public void test_addInclude_invalidRegex() { String sessionId = "test-session-004"; urlFilter.init(sessionId); // Invalid regex pattern should be handled gracefully urlFilter.addInclude(".*[invalid"); urlFilter.addInclude("https://valid.com/.*"); // Valid pattern should still work
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 19K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java
* The user-agent pattern in the directive is converted to a regular expression pattern, * where '*' is replaced with '.*' for pattern matching, and stored case-insensitively. * * @param directive The directive to add to the robots.txt rules */ public void addDirective(final Directive directive) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java
* @return the parsed charset name, or null if not found */ protected String parseCharset(final String content) { final Pattern pattern = Pattern.compile("; *charset *= *([a-zA-Z0-9\\-_]+)", Pattern.CASE_INSENSITIVE); final Matcher matcher = pattern.matcher(content); if (matcher.find()) { return matcher.group(1); } return null; } /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 28.5K bytes - Viewed (0) -
README.md
crawler.crawlerContext.setDefaultIntervalTime(1000); // 1 second ``` ### URL Filtering ```java // Include patterns crawler.urlFilter.addInclude("https://example.com/.*"); crawler.urlFilter.addInclude(".*\\.pdf$"); // Exclude patterns crawler.urlFilter.addExclude(".*\\.js$"); crawler.urlFilter.addExclude(".*login.*"); ``` ## Supported Protocols and Formats
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java
} /** * Extracts the token value from the content using the given pattern. * @param tokenPattern The regex pattern. * @param content The content to search. * @return The extracted token value. */ protected String getTokenValue(final String tokenPattern, final String content) { final Matcher matcher = Pattern.compile(tokenPattern).matcher(content); if (matcher.find()) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.3K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java
} /** * Gets the pattern for extracting charset from meta tags. * * @return the meta charset pattern */ public Pattern getMetaCharsetPattern() { return metaCharsetPattern; } /** * Sets the pattern for extracting charset from meta tags. * * @param metaCharsetPattern the meta charset pattern to set */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/AbstractRuleTest.java
ConditionalAbstractRule conditionalRule = new ConditionalAbstractRule(); conditionalRule.crawlerContainer = container; conditionalRule.setRuleId("conditionalRule"); // Set patterns conditionalRule.setUrlPattern("https?://.*\\.example\\.com/.*"); conditionalRule.setMimeTypePattern("text/.*"); // Test matching ResponseData responseData1 = new ResponseData();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 21.9K bytes - Viewed (0) -
README.md
PopularWordsResponse popularWords = suggester.popularWords() .setSize(20) // top 20 words .setQuery("tech*") // filter pattern .execute() .getResponse(); popularWords.getItems().forEach(item -> { System.out.println("Popular: " + item.getText() + " (freq: " + item.getDocFreq() + ")"); }); ```
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Sun Aug 31 03:31:14 UTC 2025 - 12.1K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java
*/ public XpathTransformer() { super(); } private static final Logger logger = LogManager.getLogger(XpathTransformer.class); private static final Pattern SPACE_PATTERN = Pattern.compile("\\s+", Pattern.MULTILINE); /** * A map of field rules, where the key is the field name and the value is the XPath expression. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 13.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/suggest/settings/ArraySettings.java
import java.time.ZonedDateTime; import java.time.format.DateTimeFormatter; import java.util.Arrays; import java.util.Base64; import java.util.HashMap; import java.util.Locale; import java.util.Map; import java.util.regex.Pattern; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.CoreLibConstants; import org.codelibs.core.lang.StringUtil;
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Thu Aug 07 02:41:28 UTC 2025 - 15.6K bytes - Viewed (0)