- Sort Score
- Num 10 results
- Language All
Results 11 - 15 of 15 for addExtractor (0.04 seconds)
-
fess-crawler-lasta/src/main/resources/crawler/extractor.xml
<postConstruct name="addExtractor"> <arg>[ "application/pdf" ]</arg> <arg>pdfExtractor</arg> </postConstruct> <postConstruct name="addExtractor"> <arg>[ "application/x-lha", "application/x-lharc" ]</arg> <arg>lhaExtractor</arg> </postConstruct> <postConstruct name="addExtractor"> <arg>[ "message/rfc822" ]</arg> <arg>emlExtractor</arg>
Created: Sat Dec 20 11:21:39 GMT 2025 - Last Modified: Sun Nov 23 03:46:53 GMT 2025 - 50.1K bytes - Click Count (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
TikaExtractor tikaExtractor = container.getComponent("tikaExtractor"); factory.addExtractor("text/plain", tikaExtractor); factory.addExtractor("text/html", tikaExtractor); })// .singleton("httpClient", HcHttpClient.class)//
Created: Sat Dec 20 11:21:39 GMT 2025 - Last Modified: Tue Nov 11 13:40:14 GMT 2025 - 25.8K bytes - Click Count (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractorTest.java
.<ExtractorFactory> singleton("extractorFactory", ExtractorFactory.class, factory -> { TikaExtractor tikaExtractor = container.getComponent("tikaExtractor"); factory.addExtractor("application/pdf", tikaExtractor); }); emlExtractor = container.getComponent("emlExtractor"); } public void test_getText() throws IOException {
Created: Sat Dec 20 11:21:39 GMT 2025 - Last Modified: Thu Aug 07 02:55:08 GMT 2025 - 4.6K bytes - Click Count (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java
if (keyList == null || keyList.isEmpty()) { throw new IllegalArgumentException("keyList must not be null or empty."); } getExtractorFactory().addExtractor(keyList, this); } /** * Returns the MimeTypeHelper instance from the CrawlerContainer. * @return The MimeTypeHelper instance. */ protected MimeTypeHelper getMimeTypeHelper() {
Created: Sat Dec 20 11:21:39 GMT 2025 - Last Modified: Wed Nov 19 08:55:01 GMT 2025 - 4.6K bytes - Click Count (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java
TikaExtractor tikaExtractor = container.getComponent("tikaExtractor"); factory.addExtractor("text/plain", tikaExtractor); factory.addExtractor("text/html", tikaExtractor); })// ; tikaExtractor = container.getComponent("tikaExtractor"); } public void test_getTika_text() {
Created: Sat Dec 20 11:21:39 GMT 2025 - Last Modified: Thu Aug 07 02:55:08 GMT 2025 - 30.6K bytes - Click Count (0)