Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 19 of 19 for tikai (0.11 sec)

  1. src/main/java/org/codelibs/fess/helper/LanguageHelper.java

    import java.util.Arrays;
    import java.util.Map;
    import java.util.stream.Collectors;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.apache.tika.language.detect.LanguageDetector;
    import org.apache.tika.language.detect.LanguageResult;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    import org.codelibs.fess.util.ComponentUtil;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:53:18 UTC 2024
    - 5.5K bytes
    - Viewed (0)
  2. pom.xml

    			<groupId>com.ibm.icu</groupId>
    			<artifactId>icu4j</artifactId>
    			<version>${icu4j.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-langdetect-optimaize</artifactId>
    			<version>${tika.version}</version>
    			<exclusions>
    				<exclusion>
    					<groupId>javax.annotation</groupId>
    					<artifactId>javax.annotation-api</artifactId>
    				</exclusion>
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Oct 26 02:16:03 UTC 2024
    - 49.1K bytes
    - Viewed (0)
  3. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/x-texinfo",
    				"application/x-tika-msoffice",
    				"application/x-tika-msoffice-embedded",
    				"application/x-tika-msoffice-embedded;format=ole10_native",
    				"application/x-tika-msoffice-embedded;format=comp_obj",
    				"application/x-tika-msworks-spreadsheet",
    				"application/x-tika-ooxml",
    				"application/x-tika-ooxml-protected",
    				"application/x-tika-staroffice",
    				"application/x-uc2-compressed",
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/job/CrawlJob.java

            } else {
                cmdList.add("-Dfess.log.level=" + logLevel);
                if ("debug".equalsIgnoreCase(logLevel)) {
                    cmdList.add("-Dorg.apache.tika.service.error.warn=true");
                }
            }
            stream(fessConfig.getJvmCrawlerOptionsAsArray())
                    .of(stream -> stream.filter(StringUtil::isNotBlank).forEach(value -> cmdList.add(value)));
    
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sun Jun 23 04:13:47 UTC 2024
    - 15.1K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java

            final String content = extractData.getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
            assertTrue(content.contains("テスト"));
        }
    
        // TODO tika needs to support pdfbox 2.0
        //    public void test_getTika_pdf() {
        //        final InputStream in = ResourceUtil
        //                .getResourceAsStream("extractor/test.pdf");
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 30.5K bytes
    - Viewed (0)
  6. src/main/resources/fess_config.properties

    crawler.hotthread.snapshots=10
    crawler.hotthread.threads=3
    crawler.hotthread.timeout=30s
    crawler.hotthread.type=cpu
    crawler.metadata.content.excludes=resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.*
    crawler.metadata.name.mapping=\
    title=title:string\n\
    Title=title:string\n\
    dc:title=title:string\n\
    
    # html
    crawler.document.html.content.xpath=//BODY
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Tue Oct 01 14:13:38 UTC 2024
    - 30.9K bytes
    - Viewed (0)
  7. okhttp/src/main/resources/okhttp3/internal/publicsuffix/PublicSuffixDatabase.gz

    tochigi.tochigi.jp tochio.niigata.jp toda.saitama.jp today toei.aichi.jp toga.toyama.jp togakushi.nagano.jp togane.chiba.jp togitsu.nagasaki.jp togliatti.su togo.aichi.jp togura.nagano.jp tohma.hokkaido.jp tohnosho.chiba.jp toho.fukuoka.jp tokai.aichi.jp tokai.ibaraki.jp tokamachi.niigata.jp tokashiki.okinawa.jp toki.gifu.jp tokigawa.saitama.jp tokke.no tokoname.aichi.jp tokorozawa.saitama.jp tokushima.jp tokushima.tokushima.jp tokuyama.yamaguchi.jp tokyo tokyo.jp tolga.no tomakomai.hokkaido.jp tomari.hokkaido.jp...
    Registered: Fri Nov 01 11:42:11 UTC 2024
    - Last Modified: Wed Dec 20 23:27:07 UTC 2023
    - 40.4K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

        /** The key of the configuration. e.g. cpu */
        String CRAWLER_HOTTHREAD_TYPE = "crawler.hotthread.type";
    
        /** The key of the configuration. e.g. resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.* */
        String CRAWLER_METADATA_CONTENT_EXCLUDES = "crawler.metadata.content.excludes";
    
        /** The key of the configuration. e.g. title=title:string<br>
         * Title=title:string<br>
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:11:58 UTC 2024
    - 468.5K bytes
    - Viewed (1)
  9. okhttp/src/test/resources/okhttp3/internal/publicsuffix/public_suffix_list.dat

    okazaki.aichi.jp
    owariasahi.aichi.jp
    seto.aichi.jp
    shikatsu.aichi.jp
    shinshiro.aichi.jp
    shitara.aichi.jp
    tahara.aichi.jp
    takahama.aichi.jp
    tobishima.aichi.jp
    toei.aichi.jp
    togo.aichi.jp
    tokai.aichi.jp
    tokoname.aichi.jp
    toyoake.aichi.jp
    toyohashi.aichi.jp
    toyokawa.aichi.jp
    toyone.aichi.jp
    toyota.aichi.jp
    tsushima.aichi.jp
    yatomi.aichi.jp
    akita.akita.jp
    daisen.akita.jp
    Registered: Fri Nov 01 11:42:11 UTC 2024
    - Last Modified: Wed Dec 20 23:27:07 UTC 2023
    - 240.3K bytes
    - Viewed (0)
Back to top