- Sort Score
- Result 10 results
- Languages All
Results 21 - 30 of 73 for etext (0.01 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java
import jakarta.annotation.Resource; /** * TextTransformer is a class that transforms a ResponseData object into a ResultData object containing the extracted text content. * It uses an Extractor to extract the text from the response body based on the MIME type. * The extracted text is then converted into a byte array using the specified charset encoding.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 6.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
* The {@link TikaExtractor} class is responsible for extracting text content and metadata from various file formats * using the Apache Tika library. It extends {@link PasswordBasedExtractor} to handle password-protected files. * </p> * * <p> * This class provides methods to extract text from an input stream, handling different scenarios such as: * </p> * <ul> * <li>Normalizing text content</li>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb/SmbAuthenticationHolderTest.java
assertEquals(fooAuth, smbAuthenticationHolder.get("smb://foo:1000/")); assertEquals(hogeAuth, smbAuthenticationHolder.get("smb://hoge/text.txt")); assertEquals(fugaAuth, smbAuthenticationHolder.get("smb://fuga/text.txt")); assertEquals(fooAuth, smbAuthenticationHolder.get("smb://foo:1000/text.txt")); assertNull(smbAuthenticationHolder.get(null)); assertNull(smbAuthenticationHolder.get(""));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractorTest.java
LhaExtractor lhaExtractor = container.getComponent("lhaExtractor"); factory.addExtractor("text/plain", tikaExtractor); factory.addExtractor("text/html", tikaExtractor); factory.addExtractor("application/x-lha", lhaExtractor); })// ;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractorTest.java
extractor.command = getCommand(scriptFile); final Map<String, String> params = new HashMap<String, String>(); final ExtractData text = extractor.getText(new FileInputStream(contentFile), params); assertEquals(content, text.getContent()); } public void test_getText_withUrl() throws IOException { final File scriptFile = createScriptTempFile(3);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 9.8K bytes - Viewed (0) -
fess-crawler/src/test/resources/extractor/test.mm
<map version="0.7.1"> <node TEXT="タイトル"> <node TEXT="テスト" MODIFIED="1237874353965" STYLE="fork"/> </node>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 162 bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/TextTransformerTest.java
TikaExtractor tikaExtractor = container.getComponent("tikaExtractor"); extractorFactory.addExtractor("text/plain", tikaExtractor); extractorFactory.addExtractor("text/html", tikaExtractor); } public void test_name() { assertEquals("textTransformer", textTransformer.getName()); }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 4.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java
import org.apache.commons.io.input.BOMInputStream; import org.apache.commons.text.translate.AggregateTranslator; import org.apache.commons.text.translate.CharSequenceTranslator; import org.apache.commons.text.translate.EntityArrays; import org.apache.commons.text.translate.LookupTranslator; import org.apache.commons.text.translate.NumericEntityUnescaper; import org.apache.logging.log4j.LogManager;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.5K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb1/SmbAuthenticationHolderTest.java
assertEquals(fooAuth, smbAuthenticationHolder.get("smb1://foo:1000/")); assertEquals(hogeAuth, smbAuthenticationHolder.get("smb1://hoge/text.txt")); assertEquals(fugaAuth, smbAuthenticationHolder.get("smb1://fuga/text.txt")); assertEquals(fooAuth, smbAuthenticationHolder.get("smb1://foo:1000/text.txt")); assertNull(smbAuthenticationHolder.get(null)); assertNull(smbAuthenticationHolder.get(""));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java
import org.jodconverter.core.office.OfficeManager; import org.jodconverter.local.LocalConverter; import jakarta.annotation.PostConstruct; import jakarta.annotation.PreDestroy; /** * Extracts text content from various document formats using JODConverter. */ public class JodExtractor extends AbstractExtractor { /** Logger for this class. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0)