- Sort Score
- Num 10 results
- Language All
Results 1 - 2 of 2 for UrlFilterImpl (0.05 seconds)
-
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
import java.io.File; import org.codelibs.core.io.ResourceUtil; import org.codelibs.fess.crawler.container.CrawlerContainer; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.filter.impl.UrlFilterImpl; import org.codelibs.fess.crawler.service.DataService; import org.codelibs.fess.crawler.service.UrlQueueService; import org.codelibs.fess.crawler.transformer.impl.FileTransformer;
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Thu Jan 15 01:11:43 GMT 2026 - 13.1K bytes - Click Count (0) -
README.md
client.setUserAgent("MyBot/1.0"); client.setConnectionTimeout(30000); client.setMaxConnections(100); }); // Configure URL filtering container.singleton("urlFilter", UrlFilterImpl.class, filter -> { filter.addInclude("https://example.com/.*"); filter.addExclude(".*\\.(css|js|png|jpg|gif)$"); }); // Configure content extraction
Created: Sun Apr 12 03:50:13 GMT 2026 - Last Modified: Sun Aug 31 05:32:52 GMT 2025 - 15.3K bytes - Click Count (0)