Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 30 for tika (0.07 sec)

  1. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/x-texinfo",
    				"application/x-tika-msoffice",
    				"application/x-tika-msoffice-embedded",
    				"application/x-tika-msoffice-embedded;format=ole10_native",
    				"application/x-tika-msoffice-embedded;format=comp_obj",
    				"application/x-tika-msworks-spreadsheet",
    				"application/x-tika-ooxml",
    				"application/x-tika-ooxml-protected",
    				"application/x-tika-staroffice",
    				"application/x-uc2-compressed",
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/job/CrawlJob.java

            } else {
                cmdList.add("-Dfess.log.level=" + logLevel);
                if ("debug".equalsIgnoreCase(logLevel)) {
                    cmdList.add("-Dorg.apache.tika.service.error.warn=true");
                }
            }
            stream(fessConfig.getJvmCrawlerOptionsAsArray())
                    .of(stream -> stream.filter(StringUtil::isNotBlank).forEach(value -> cmdList.add(value)));
    
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sun Jun 23 04:13:47 UTC 2024
    - 15.1K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java

            final String content = extractData.getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
            assertTrue(content.contains("テスト"));
        }
    
        // TODO tika needs to support pdfbox 2.0
        //    public void test_getTika_pdf() {
        //        final InputStream in = ResourceUtil
        //                .getResourceAsStream("extractor/test.pdf");
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 30.5K bytes
    - Viewed (0)
  4. src/main/resources/fess_config.properties

    crawler.hotthread.snapshots=10
    crawler.hotthread.threads=3
    crawler.hotthread.timeout=30s
    crawler.hotthread.type=cpu
    crawler.metadata.content.excludes=resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.*
    crawler.metadata.name.mapping=\
    title=title:string\n\
    Title=title:string\n\
    dc:title=title:string\n\
    
    # html
    crawler.document.html.content.xpath=//BODY
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Tue Oct 01 14:13:38 UTC 2024
    - 30.9K bytes
    - Viewed (0)
  5. src/main/resources/fess_indices/_aws/fess.json

    "taču", "nu", "pat", "tiklab", "iekšpus", "nedz", "tik", "nevis", "turpretim", "jeb", "iekam", "iekām", "iekāms", "kolīdz", "līdzko", "tiklīdz", "jebšu", "tālab", "tāpēc", "nekā", "itin", "jā", "jau", "jel", "nē", "nezin", "tad", "tikai", "vis", "tak", "iekams", "vien", "# modal verbs", "būt  ", "biju ", "biji", "bija", "bijām", "bijāt", "esmu", "esi", "esam", "esat ", "būšu     ", "būsi", "būs", "būsim", "būsiet", "tikt", "tiku", "tiki", "tika", "tikām", "tikāt", "tieku", "tiec", "tiek", "tiekam",...
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Tue Mar 23 12:38:28 UTC 2021
    - 117.3K bytes
    - Viewed (0)
  6. src/main/resources/fess_indices/_cloud/fess.json

    "taču", "nu", "pat", "tiklab", "iekšpus", "nedz", "tik", "nevis", "turpretim", "jeb", "iekam", "iekām", "iekāms", "kolīdz", "līdzko", "tiklīdz", "jebšu", "tālab", "tāpēc", "nekā", "itin", "jā", "jau", "jel", "nē", "nezin", "tad", "tikai", "vis", "tak", "iekams", "vien", "# modal verbs", "būt  ", "biju ", "biji", "bija", "bijām", "bijāt", "esmu", "esi", "esam", "esat ", "būšu     ", "būsi", "būs", "būsim", "būsiet", "tikt", "tiku", "tiki", "tika", "tikām", "tikāt", "tieku", "tiec", "tiek", "tiekam",...
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Feb 27 09:26:16 UTC 2021
    - 117.3K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

        /** The key of the configuration. e.g. cpu */
        String CRAWLER_HOTTHREAD_TYPE = "crawler.hotthread.type";
    
        /** The key of the configuration. e.g. resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.* */
        String CRAWLER_METADATA_CONTENT_EXCLUDES = "crawler.metadata.content.excludes";
    
        /** The key of the configuration. e.g. title=title:string<br>
         * Title=title:string<br>
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:11:58 UTC 2024
    - 468.5K bytes
    - Viewed (1)
  8. guava-tests/test/com/google/common/base/SplitterTest.java

            COMMA_SPLITTER
                .trimResults()
                .withKeyValueSeparator(Splitter.on(':').trimResults())
                .split("boy  : tom , girl: tina , cat  : kitty , dog: tommy ");
        ImmutableMap<String, String> expected =
            ImmutableMap.of("boy", "tom", "girl", "tina", "cat", "kitty", "dog", "tommy");
        assertThat(m).isEqualTo(expected);
        assertThat(m.entrySet()).containsExactlyElementsIn(expected.entrySet()).inOrder();
    Registered: Fri Nov 01 12:43:10 UTC 2024
    - Last Modified: Tue Sep 17 18:14:12 UTC 2024
    - 29.6K bytes
    - Viewed (0)
  9. src/main/resources/fess_indices/fess/gl/stopwords.txt

    polas
    polo
    polos
    por
    que
    se
    senón
    ser
    seu
    seus
    sexa
    sido
    sobre
    súa
    súas
    tamén
    tan
    te
    ten
    teñen
    teño
    ter
    teu
    teus
    ti
    tido
    tiña
    tiven
    túa
    túas
    un
    unha
    unhas
    uns
    vos
    vosa
    vosas
    voso
    vosos
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Jul 19 06:31:02 UTC 2018
    - 932 bytes
    - Viewed (0)
  10. src/main/resources/fess_indices/fess/fi/stopwords.txt

    ketä
    kenessä
    kenestä
    keneen
    kenellä
    keneltä
    kenelle
    kenenä
    keneksi
    ketkä
    keiden
    ketkä
    keitä
    keissä
    keistä
    keihin
    keillä
    keiltä
    keille
    keinä
    keiksi
    mikä
    minkä
    minkä
    mitä
    missä
    mistä
    mihin
    millä
    miltä
    mille
    minä
    miksi
    mitkä
    joka
    jonka
    jota
    jossa
    josta
    johon
    jolla
    jolta
    jolle
    jona
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Mon Nov 27 12:59:36 UTC 2023
    - 1.7K bytes
    - Viewed (0)
Back to top