Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 16 for tika (0.02 sec)

  1. pom.xml

    			<groupId>com.ibm.icu</groupId>
    			<artifactId>icu4j</artifactId>
    			<version>${icu4j.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-langdetect-optimaize</artifactId>
    			<version>${tika.version}</version>
    			<exclusions>
    				<exclusion>
    					<groupId>javax.annotation</groupId>
    					<artifactId>javax.annotation-api</artifactId>
    				</exclusion>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Sep 04 05:22:58 UTC 2025
    - 49.6K bytes
    - Viewed (0)
  2. src/main/resources/fess.xml

    		<property name="valueSeparator">"\\n"</property>
    		<property name="roleSeparator">","</property>
    		 -->
    	</component>
    	<component name="tikaConfig" class="org.apache.tika.config.TikaConfig">
    		<arg>org.codelibs.fess.util.ResourceUtil.getConfOrClassesPath("tika.xml")</arg>
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Jul 28 09:03:48 UTC 2024
    - 5.2K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/helper/LanguageHelper.java

    import java.util.Arrays;
    import java.util.Map;
    import java.util.stream.Collectors;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.apache.tika.language.detect.LanguageDetector;
    import org.apache.tika.language.detect.LanguageResult;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    import org.codelibs.fess.util.ComponentUtil;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 6.9K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

        public Logger getLogger() {
            return logger;
        }
    
        /**
         * Gets the appropriate extractor for the given response data.
         * Selects an extractor based on the MIME type or falls back to the Tika extractor.
         *
         * @param responseData the response data containing the document to extract
         * @return the extractor instance for processing the document
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/job/CrawlJob.java

            } else {
                cmdList.add("-Dfess.log.level=" + logLevel);
                if ("debug".equalsIgnoreCase(logLevel)) {
                    cmdList.add("-Dorg.apache.tika.service.error.warn=true");
                }
            }
            stream(fessConfig.getJvmCrawlerOptionsAsArray())
                    .of(stream -> stream.filter(StringUtil::isNotBlank).forEach(value -> cmdList.add(value)));
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 19.6K bytes
    - Viewed (0)
  6. src/main/resources/fess_config.properties

    # Type of hot thread monitoring (e.g., cpu).
    crawler.hotthread.type=cpu
    # Metadata fields to exclude from document content.
    crawler.metadata.content.excludes=resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.*
    # Mapping for document metadata names.
    crawler.metadata.name.mapping=\
    title=title:string\n\
    Title=title:string\n\
    dc:title=title:string\n\
    
    # html
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jul 05 14:45:37 UTC 2025
    - 54.7K bytes
    - Viewed (0)
  7. src/main/resources/fess_indices/_aws/fess.json

    "taču", "nu", "pat", "tiklab", "iekšpus", "nedz", "tik", "nevis", "turpretim", "jeb", "iekam", "iekām", "iekāms", "kolīdz", "līdzko", "tiklīdz", "jebšu", "tālab", "tāpēc", "nekā", "itin", "jā", "jau", "jel", "nē", "nezin", "tad", "tikai", "vis", "tak", "iekams", "vien", "# modal verbs", "būt  ", "biju ", "biji", "bija", "bijām", "bijāt", "esmu", "esi", "esam", "esat ", "būšu     ", "būsi", "būs", "būsim", "būsiet", "tikt", "tiku", "tiki", "tika", "tikām", "tikāt", "tieku", "tiec", "tiek", "tiekam",...
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jun 14 00:36:40 UTC 2025
    - 117.3K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

        /** The key of the configuration. e.g. cpu */
        String CRAWLER_HOTTHREAD_TYPE = "crawler.hotthread.type";
    
        /** The key of the configuration. e.g. resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.* */
        String CRAWLER_METADATA_CONTENT_EXCLUDES = "crawler.metadata.content.excludes";
    
        /** The key of the configuration. e.g. title=title:string<br>
         * Title=title:string<br>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 525.6K bytes
    - Viewed (1)
  9. guava-tests/test/com/google/common/base/SplitterTest.java

            COMMA_SPLITTER
                .trimResults()
                .withKeyValueSeparator(Splitter.on(':').trimResults())
                .split("boy  : tom , girl: tina , cat  : kitty , dog: tommy ");
        ImmutableMap<String, String> expected =
            ImmutableMap.of("boy", "tom", "girl", "tina", "cat", "kitty", "dog", "tommy");
        assertThat(m).isEqualTo(expected);
        assertThat(m.entrySet()).containsExactlyElementsIn(expected.entrySet()).inOrder();
    Registered: Fri Sep 05 12:43:10 UTC 2025
    - Last Modified: Thu Aug 07 16:05:33 UTC 2025
    - 29.5K bytes
    - Viewed (0)
  10. src/main/resources/fess_indices/fess/fi/stopwords.txt

    ketä
    kenessä
    kenestä
    keneen
    kenellä
    keneltä
    kenelle
    kenenä
    keneksi
    ketkä
    keiden
    ketkä
    keitä
    keissä
    keistä
    keihin
    keillä
    keiltä
    keille
    keinä
    keiksi
    mikä
    minkä
    minkä
    mitä
    missä
    mistä
    mihin
    millä
    miltä
    mille
    minä
    miksi
    mitkä
    joka
    jonka
    jota
    jossa
    josta
    johon
    jolla
    jolta
    jolle
    jona
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Mon Nov 27 12:59:36 UTC 2023
    - 1.7K bytes
    - Viewed (0)
Back to top