Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 3 of 3 for textExtractor (0.08 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * @author shinsuke
     *
     */
    public class TextExtractor extends AbstractExtractor {
    
        protected String encoding = Constants.UTF_8;
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.7K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TextExtractorTest.java

        public TextExtractor textExtractor;
    
        @Override
        protected void setUp() throws Exception {
            super.setUp();
            StandardCrawlerContainer container = new StandardCrawlerContainer().singleton("textExtractor", TextExtractor.class);
            textExtractor = container.getComponent("textExtractor");
        }
    
        public void test_getText() {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 2K bytes
    - Viewed (0)
  3. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    		class="org.codelibs.fess.crawler.extractor.impl.PdfExtractor" />
    	<component name="lhaExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.LhaExtractor" />
    	<component name="textExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.TextExtractor" />
    	<component name="htmlExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.HtmlExtractor">
    		<property name="featureMap">
    			<component class="java.util.LinkedHashMap">
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
Back to top