Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 61 - 70 of 103 for etext (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content from Microsoft PowerPoint documents.
     */
    public class MsPowerPointExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPowerPointExtractor instance.
         */
        public MsPowerPointExtractor() {
            super();
        }
    
        /**
         * Extracts text from the PowerPoint input stream.
         * @param in The input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text from a Microsoft Visio file.
     *
     * @author shinsuke
     *
     */
    public class MsVisioExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsVisioExtractor instance.
         */
        public MsVisioExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Visio input stream.
         * @param in The input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/suggest/converter/KatakanaConverter.java

             */
        }
    
        /**
         * Produces the reading candidates for the given text.
         * The result is a new mutable list holding exactly one entry: the value
         * returned by {@code toKatakana(text)}. The {@code field} and {@code langs}
         * arguments are not consulted by this implementation.
         *
         * @param text the text to convert
         * @param field the field name (unused here)
         * @param langs the language hints (unused here)
         * @return a single-element list containing the Katakana form of {@code text}
         * @throws IOException declared by the method signature; presumably propagated
         *         from {@code toKatakana} (its definition is not visible in this excerpt)
         */
        @Override
        public List<String> convert(final String text, final String field, final String... langs) throws IOException {
            final String katakana = toKatakana(text);
            final List<String> readings = new ArrayList<>();
            readings.add(katakana);
            return readings;
        }
    
        /**
         * Converts the input string to Katakana.
         * @param inputStr The input string.
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 6.1K bytes
    - Viewed (0)
  4. src/test/java/org/codelibs/fess/suggest/settings/AnalyzerSettingsTest.java

            String text = "Fess (フェス) は「5 分で簡単に構築可能な全文検索サーバー」です。 Java 実行環境があればどの OS でも実行可能です。 Fess は Apache ライセンスで提供され、無料 (フリーソフト) でご利用いただけます。";
            SuggestAnalyzer analyzer = SuggestUtil.createDefaultAnalyzer(runner.client(), settings);
            final List<AnalyzeToken> tokens = analyzer.analyze(text, "", null);
            final List<AnalyzeToken> readingTokens = analyzer.analyzeAndReading(text, "", null);
    
            int matchCount = 0;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 5.2K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractorTest.java

            final Map<String, String> params = new HashMap<String, String>();
            //final ExtractData text = extractor.getText(new ByteArrayInputStream(FileUtils.readFileToByteArray(new File(filePath))), params);
            final ExtractData text = extractor.getText(new ByteArrayInputStream(testStr.getBytes()), params);
            assertEquals(content, text.getContent());
        }
    
        // TODO other tests
    
        static class TestApiExtractorServer {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.4K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TarExtractorTest.java

                        TarExtractor tarExtractor = container.getComponent("tarExtractor");
                        factory.addExtractor("text/plain", tikaExtractor);
                        factory.addExtractor("text/html", tikaExtractor);
                        factory.addExtractor("application/tar", tarExtractor);
                    })//
            ;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

         */
        public LhaExtractor() {
            super();
        }
    
        /**
         * Extracts text content from an LHA archive input stream.
         *
         * @param in the input stream containing the LHA archive
         * @param params extraction parameters
         * @return the extracted text data
         * @throws CrawlerSystemException if the input stream is null
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  8. fess-crawler/src/test/resources/html/test1.shtml

    <html>
    <head>
    <meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
    <title>タイトル</title>
    </head>
    <body>
    <h1>第一章</h1>
    <h2>第一節</h2>
    <p>ほげほげ<br>ふがふが</p>
    <p>
    <a href="test2.html">LINK</a>
    </p>
    <h1>第2章</h1>
    <h2>第2節</h2>
    </body>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 289 bytes
    - Viewed (0)
  9. fess-crawler/src/test/resources/html/test1.html

    <html>
    <head>
    <meta http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
    <title>タイトル</title>
    </head>
    <body>
    <h1>第一章</h1>
    <h2>第一節</h2>
    <p>ほげほげ<br>ふがふが</p>
    <p>
    <a href="test2.html">LINK</a>
    </p>
    <h1>第2章</h1>
    <h2>第2節</h2>
    </body>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 289 bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

    import org.xml.sax.SAXNotSupportedException;
    import org.xml.sax.helpers.DefaultHandler;
    
    /**
     * Helper class for parsing and validating sitemaps.
     * It supports XML sitemaps, XML sitemap indexes, and text sitemaps,
     * and can handle GZIP compressed sitemaps.
     * The class provides methods to check if an input stream is a valid sitemap,
     * and to parse an input stream into a {@link SitemapSet} object.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
Back to top