Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 35 for tika (0.02 sec)

  1. src/main/resources/tika.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <properties>
      <parsers>
        <parser class="org.apache.tika.parser.DefaultParser">
          <parser-exclude class="org.apache.tika.parser.ocr.TesseractOCRParser"/>
        </parser>
      </parsers>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Mon Feb 24 12:59:41 UTC 2020
    - 241 bytes
    - Viewed (0)
  2. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      <!--  an OLE2 (application/x-tika-msoffice) container. -->
      <!--  The are logically subclasses of (application/x-tika-ooxml),
            but their containers are literally subclasses
            of (application/x-tika-msoffice) -->
      <mime-type type="application/x-tika-ooxml-protected">
        <sub-class-of type="application/x-tika-msoffice"/>
        <_comment>Password Protected OOXML File</_comment>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ExtractData.java

    import java.util.Map;
    import java.util.Set;
    
    import org.apache.tika.metadata.ClimateForcast;
    import org.apache.tika.metadata.CreativeCommons;
    import org.apache.tika.metadata.Geographic;
    import org.apache.tika.metadata.HttpHeaders;
    import org.apache.tika.metadata.Message;
    import org.apache.tika.metadata.TIFF;
    import org.apache.tika.metadata.TikaCoreProperties;
    import org.apache.tika.metadata.TikaMimeKeys;
    
    /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  4. fess-crawler/pom.xml

    			<artifactId>tika-parser-html-module</artifactId>
    			<version>${tika.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-parser-image-module</artifactId>
    			<version>${tika.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-parser-mail-module</artifactId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.3K bytes
    - Viewed (0)
  5. src/main/resources/fess_indices/fess/lv/stopwords.txt

    esam
    esat 
    būšu     
    būsi
    būs
    būsim
    būsiet
    tikt
    tiku
    tiki
    tika
    tikām
    tikāt
    tieku
    tiec
    tiek
    tiekam
    tiekat
    tikšu
    tiks
    tiksim
    tiksiet
    tapt
    tapi
    tapāt
    topat
    tapšu
    tapsi
    taps
    tapsim
    tapsiet
    kļūt
    kļuvu
    kļuvi
    kļuva
    kļuvām
    kļuvāt
    kļūstu
    kļūsti
    kļūst
    kļūstam
    kļūstat
    kļūšu
    kļūsi
    kļūs
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 19 06:31:02 UTC 2018
    - 1.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/MimeTypeHelperImpl.java

    import java.io.BufferedInputStream;
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.HashMap;
    import java.util.Map;
    
    import org.apache.tika.metadata.Metadata;
    import org.apache.tika.mime.MediaType;
    import org.apache.tika.mime.MimeTypes;
    import org.apache.tika.mime.MimeTypesFactory;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.apache.tika.config.TikaConfig;
    import org.apache.tika.detect.Detector;
    import org.apache.tika.exception.TikaException;
    import org.apache.tika.extractor.EmbeddedDocumentExtractor;
    import org.apache.tika.extractor.ParsingEmbeddedDocumentExtractor;
    import org.apache.tika.io.TemporaryResources;
    import org.apache.tika.io.TikaInputStream;
    import org.apache.tika.metadata.Metadata;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  8. src/main/resources/fess.xml

    		<property name="valueSeparator">"\\n"</property>
    		<property name="roleSeparator">","</property>
    		 -->
    	</component>
    	<component name="tikaConfig" class="org.apache.tika.config.TikaConfig">
    		<arg>org.codelibs.fess.util.ResourceUtil.getConfOrClassesPath("tika.xml")</arg>
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Jul 28 09:03:48 UTC 2024
    - 5.2K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/helper/LanguageHelper.java

    import java.util.Arrays;
    import java.util.Map;
    import java.util.stream.Collectors;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.apache.tika.language.detect.LanguageDetector;
    import org.apache.tika.language.detect.LanguageResult;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    import org.codelibs.fess.util.ComponentUtil;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 6.9K bytes
    - Viewed (0)
  10. pom.xml

    			<groupId>com.ibm.icu</groupId>
    			<artifactId>icu4j</artifactId>
    			<version>${icu4j.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-langdetect-optimaize</artifactId>
    			<version>${tika.version}</version>
    			<exclusions>
    				<exclusion>
    					<groupId>javax.annotation</groupId>
    					<artifactId>javax.annotation-api</artifactId>
    				</exclusion>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Sep 04 05:22:58 UTC 2025
    - 49.6K bytes
    - Viewed (0)
Back to top