Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 4 of 4 for TikaExtractor (0.18 sec)

  1. src/main/resources/crawler/extractor+tikaExtractor.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<component name="tikaExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor">
    		<property name="maxCompressionRatio">2</property>
    		<property name="maxUncompressionSize">10000000</property>
    	</component>
    XML
    - Registered: Mon Apr 22 08:04:10 GMT 2024
    - Last Modified: Sun Aug 25 12:46:12 GMT 2019
    - 461 bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

            }
            try {
                final TikaExtractor tikaExtractor = ComponentUtil.getComponent("tikaExtractor");
                if (tikaExtractor != null) {
                    tikaExtractor.setMaxAlphanumTermSize(getMaxAlphanumTermSize());
                    tikaExtractor.setMaxSymbolTermSize(getMaxSymbolTermSize());
                    tikaExtractor.setReplaceDuplication(isDuplicateTermRemoved());
                    tikaExtractor.setSpaceChars(getSpaceChars());
    Java
    - Registered: Mon Apr 22 08:04:10 GMT 2024
    - Last Modified: Thu Feb 22 01:37:57 GMT 2024
    - 12K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

            if (extractor == null) {
                extractor = ComponentUtil.getComponent("tikaExtractor");
                if (extractor == null) {
                    throw new FessSystemException("Could not find tikaExtractor.");
                }
            }
    
            if (logger.isDebugEnabled()) {
                logger.debug("url={}, extractor={}", responseData.getUrl(), extractor);
    Java
    - Registered: Mon Apr 22 08:04:10 GMT 2024
    - Last Modified: Thu Feb 22 01:37:57 GMT 2024
    - 2.4K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.impl.TikaExtractor;
    import org.codelibs.fess.crawler.transformer.impl.AbstractTransformer;
    import org.codelibs.fess.crawler.util.CrawlingParameterUtil;
    import org.codelibs.fess.es.config.exentity.CrawlingConfig;
    Java
    - Registered: Mon Apr 22 08:04:10 GMT 2024
    - Last Modified: Thu Feb 22 01:37:57 GMT 2024
    - 23.5K bytes
    - Viewed (0)
Back to top