Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 73 for etext (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

    import jakarta.annotation.Resource;
    
    /**
     * TextTransformer is a class that transforms a ResponseData object into a ResultData object containing the extracted text content.
     * It uses an Extractor to extract the text from the response body based on the MIME type.
     * The extracted text is then converted into a byte array using the specified charset encoding.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

     * The {@link TikaExtractor} class is responsible for extracting text content and metadata from various file formats
     * using the Apache Tika library. It extends {@link PasswordBasedExtractor} to handle password-protected files.
     * </p>
     *
     * <p>
     * This class provides methods to extract text from an input stream, handling different scenarios such as:
     * </p>
     * <ul>
     *   <li>Normalizing text content</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb/SmbAuthenticationHolderTest.java

            assertEquals(fooAuth, smbAuthenticationHolder.get("smb://foo:1000/"));
            assertEquals(hogeAuth, smbAuthenticationHolder.get("smb://hoge/text.txt"));
            assertEquals(fugaAuth, smbAuthenticationHolder.get("smb://fuga/text.txt"));
            assertEquals(fooAuth, smbAuthenticationHolder.get("smb://foo:1000/text.txt"));
    
            assertNull(smbAuthenticationHolder.get(null));
            assertNull(smbAuthenticationHolder.get(""));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.3K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractorTest.java

                        LhaExtractor lhaExtractor = container.getComponent("lhaExtractor");
                        factory.addExtractor("text/plain", tikaExtractor);
                        factory.addExtractor("text/html", tikaExtractor);
                        factory.addExtractor("application/x-lha", lhaExtractor);
    
                    })//
            ;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractorTest.java

            extractor.command = getCommand(scriptFile);
            final Map<String, String> params = new HashMap<String, String>();
            final ExtractData text = extractor.getText(new FileInputStream(contentFile), params);
            assertEquals(content, text.getContent());
        }
    
        public void test_getText_withUrl() throws IOException {
            final File scriptFile = createScriptTempFile(3);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.8K bytes
    - Viewed (0)
  6. fess-crawler/src/test/resources/extractor/test.mm

    <map version="0.7.1">
    <node TEXT="&#12479;&#12452;&#12488;&#12523;">
    <node TEXT="&#12486;&#12473;&#12488;" MODIFIED="1237874353965" STYLE="fork"/>
    </node>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 162 bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/TextTransformerTest.java

            TikaExtractor tikaExtractor = container.getComponent("tikaExtractor");
            extractorFactory.addExtractor("text/plain", tikaExtractor);
            extractorFactory.addExtractor("text/html", tikaExtractor);
        }
    
        public void test_name() {
            assertEquals("textTransformer", textTransformer.getName());
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

    import org.apache.commons.io.input.BOMInputStream;
    import org.apache.commons.text.translate.AggregateTranslator;
    import org.apache.commons.text.translate.CharSequenceTranslator;
    import org.apache.commons.text.translate.EntityArrays;
    import org.apache.commons.text.translate.LookupTranslator;
    import org.apache.commons.text.translate.NumericEntityUnescaper;
    import org.apache.logging.log4j.LogManager;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb1/SmbAuthenticationHolderTest.java

            assertEquals(fooAuth, smbAuthenticationHolder.get("smb1://foo:1000/"));
            assertEquals(hogeAuth, smbAuthenticationHolder.get("smb1://hoge/text.txt"));
            assertEquals(fugaAuth, smbAuthenticationHolder.get("smb1://fuga/text.txt"));
            assertEquals(fooAuth, smbAuthenticationHolder.get("smb1://foo:1000/text.txt"));
    
            assertNull(smbAuthenticationHolder.get(null));
            assertNull(smbAuthenticationHolder.get(""));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.jodconverter.core.office.OfficeManager;
    import org.jodconverter.local.LocalConverter;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
     * Extracts text content from various document formats using JODConverter.
     */
    public class JodExtractor extends AbstractExtractor {
        /** Logger for this class. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
Back to top