- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 12 for urlFilter (0.1 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/UrlFilter.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.filter; /** * UrlFilter checks if a given url is a target one. * * @author shinsuke * */ public interface UrlFilter { /** * Initialize a url filter by sessionId. * * @param sessionId Session ID */ void init(String sessionId); /**
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler.crawlerContext.setMaxThreadCheckCount(3); crawler.crawlerContext.setMaxAccessCount(maxCount); crawler.crawlerContext.setNumOfThread(numOfThread); crawler.urlFilter.addInclude(url + ".*"); crawler.urlFilter.addExclude(url + "/dir1/.*"); final String sessionId = crawler.execute(); assertEquals(maxCount, dataService.getCount(sessionId)); dataService.delete(sessionId); }
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 18K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler.crawlerContext.setMaxThreadCheckCount(3); crawler.crawlerContext.setMaxAccessCount(maxCount); crawler.crawlerContext.setNumOfThread(numOfThread); crawler.urlFilter.addInclude(url + ".*"); crawler.urlFilter.addExclude(url + "/dir1/.*"); final String sessionId = crawler.execute(); assertEquals(maxCount, dataService.getCount(sessionId)); dataService.delete(sessionId); }
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 11.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImplTest.java
assertEquals(0, urlFilter.cachedIncludeSet.size()); assertEquals(0, urlFilter.cachedExcludeSet.size()); urlFilter.addExclude(".*[test.*"); assertEquals(0, urlFilter.cachedIncludeSet.size()); assertEquals(0, urlFilter.cachedExcludeSet.size()); final String sessionId = "id1"; urlFilter.init(sessionId); assertEquals(0, urlFilter.cachedIncludeSet.size());
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 6.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java
.singleton("urlFilter", UrlFilterImpl.class)// .singleton("robotsTxtHelper", RobotsTxtHelper.class)// .singleton("httpClient", HcHttpClient.class); httpClient = container.getComponent("httpClient"); urlFilter = container.getComponent("urlFilter"); } public void test_doGet() {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu May 09 09:28:25 UTC 2024 - 8.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
} public void setUrlFilter(final UrlFilter urlFilter) { this.urlFilter = urlFilter; } public RuleManager getRuleManager() { return ruleManager; } public void setRuleManager(final RuleManager ruleManager) { this.ruleManager = ruleManager; } public IntervalController getIntervalController() { return intervalController; }
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 7.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java
import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.filter.UrlFilter; import org.codelibs.fess.crawler.service.UrlFilterService; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import jakarta.annotation.Resource; /** * @author shinsuke * */ public class UrlFilterImpl implements UrlFilter { private static final Logger logger = LoggerFactory.getLogger(UrlFilterImpl.class);
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 7.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
return status; } public void setStatus(final CrawlerStatus status) { this.status = status; } public UrlFilter getUrlFilter() { return urlFilter; } public void setUrlFilter(final UrlFilter urlFilter) { this.urlFilter = urlFilter; } public RuleManager getRuleManager() { return ruleManager; }
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:40:57 UTC 2024 - 4.5K bytes - Viewed (0) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
crawler.addUrl(url); crawler.getCrawlerContext().setMaxAccessCount(maxCount); crawler.getCrawlerContext().setNumOfThread(numOfThread); crawler.urlFilter.addInclude(url + ".*"); final String sessionId = crawler.execute(); assertEquals(maxCount, dataService.getCount(sessionId)); dataService.delete(sessionId); } finally {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Nov 07 04:44:10 UTC 2024 - 7.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java
final List<UrlQueue<?>> childList = childUrlList.stream().filter(d -> StringUtil.isNotBlank(d.getUrl()) && urlSet.add(d.getUrl() + "\n" + d.getMetaData()) && crawlerContext.urlFilter.match(d.getUrl())).map(d -> { final UrlQueue<?> uq = crawlerContainer.getComponent("urlQueue"); uq.setCreateTime(SystemUtil.currentTimeMillis()); uq.setDepth(depth);
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:41:37 UTC 2024 - 15.5K bytes - Viewed (0)