- Sort Score
- Result 10 results
- Languages All
Results 11 - 13 of 13 for tikaExtractor (0.06 sec)
-
README.md
}); // Configure content extraction container.singleton("tikaExtractor", TikaExtractor.class); container.singleton("extractorFactory", ExtractorFactory.class, factory -> { factory.addExtractor("text/html", container.getComponent("tikaExtractor")); factory.addExtractor("application/pdf", container.getComponent("tikaExtractor")); }); Crawler crawler = container.getComponent("crawler");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java
private String filename; /** Cache file size threshold in bytes */ private int cacheFileSize = 1_000_000; /** Name of the extractor to use */ private String extractorName = "tikaExtractor"; /** Maximum content length allowed */ private long maxContentLength = -1; /** * Constructs a new ExtractorBuilder. * * @param crawlerContainer the crawler container
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.1K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler/extractor.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <component name="tikaExtractor" class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor"> <property name="maxCompressionRatio">1</property> <property name="maxUncompressionSize">10000000</property> </component> <component name="msWordExtractor"
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Aug 01 21:40:30 UTC 2020 - 49K bytes - Viewed (0)