- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 19 for caching (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java
* It uses XPath expressions to extract text content from HTML documents. * <p> * This class provides methods to configure the XPath expressions, parser features, and properties. * It also includes caching mechanism for XPathAPI instances to improve performance. * </p> * <p> * The extracted text is obtained from the nodes selected by the {@code targetNodePath} XPath expression.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java
/** * Returns the most specific directive matching the given user agent. * The method finds the longest matching user agent pattern in the directives, * excluding the general "*" pattern which matches all bots. * * @param userAgent the user agent string to match against directives, * can be null (treated as empty string) * @return the most specific matching directive, or null if no directive matches
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/RuleManagerTest.java
TestRule rule = new TestRule("rule1", true); ruleManager.addRule(rule); assertFalse(ruleManager.hasRule(null)); } /** * Test getRule with matching rule */ public void test_getRule_matching() { TestRule rule1 = new TestRule("rule1", false); TestRule rule2 = new TestRule("rule2", true); TestRule rule3 = new TestRule("rule3", false);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 23.8K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/AbstractCrawlerService.java
} } /** * Gets the count of documents matching the search criteria. * * @param callback The callback to configure the search request. * @return The number of matching documents. */ public int getCount(final Consumer<SearchRequestBuilder> callback) { final TotalHits totalHits = getClient().get(c -> {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 34.2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/AbstractRuleTest.java
conditionalRule.setMimeTypePattern("text/.*"); // Test matching ResponseData responseData1 = new ResponseData(); responseData1.setUrl("http://www.example.com/page"); responseData1.setMimeType("text/html"); assertTrue(conditionalRule.match(responseData1)); // Test non-matching URL ResponseData responseData2 = new ResponseData();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 21.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/RuleTest.java
// Clear conditions rule.clearConditions(); // Should match after clearing conditions assertTrue(rule.match(responseData)); } /** * Test rule matching with various ResponseData states */ public void test_matchWithVariousResponseDataStates() { ConfigurableRule rule = new ConfigurableRule(); rule.setRuleId("stateRule");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 22.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java
for (int i = 0; i < 1000; i++) { urlFilter.addInclude("https://site" + i + ".com/.*"); urlFilter.addExclude(".*\\.exclude" + i + "$"); } // Test matching performance assertTrue(urlFilter.match("https://site500.com/page")); assertFalse(urlFilter.match("https://site500.com/file.exclude500")); assertFalse(urlFilter.match("https://unknown.com/page"));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 19K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 10.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
*/ @Override public void close() { clientFactory.close(); } /** * Adds an include filter for URLs. * Only URLs matching this regular expression will be crawled. * @param regexp The regular expression for the include filter. */ public void addIncludeFilter(final String regexp) { if (StringUtil.isNotBlank(regexp)) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/exception/CrawlerSystemExceptionTest.java
assertEquals(original.getCause().getClass(), deserialized.getCause().getClass()); } /** * Test throwing and catching the exception */ public void test_throwAndCatch() { try { throw new CrawlerSystemException("Test throw"); } catch (CrawlerSystemException e) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 20K bytes - Viewed (0)