- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 75 for Next (0.05 sec)
-
fess-crawler-lasta/src/main/resources/crawler/extractor.xml
"text/x-cobol", "text/x-coldfusion", "text/x-common-lisp", "text/x-diff", "text/x-eiffel", "text/x-emacs-lisp", "text/x-erlang", "text/x-expect", "text/x-forth", "text/x-fortran", "text/x-go", "text/x-groovy", "text/x-haskell", "text/x-idl", "text/x-ini", "text/x-java-source", "text/x-jsp",
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Aug 01 21:40:30 UTC 2020 - 49K bytes - Viewed (0) -
fess-crawler/src/test/resources/extractor/test_sjis.html
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 149 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java
/** * The Extractor interface defines methods for extracting text data from an input stream. * Implementations of this interface should provide the logic for extracting text and * optionally override the default weight value. */ public interface Extractor { /** * Extracts text data from the given input stream. * * @param in the input stream to extract text from
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java
} /** * Extracts a date string from the received header text. * * @param text the received header text * @return the date string starting from the day of week, or null if not found */ private static String getDateString(final String text) { for (final String dow : DAY_OF_WEEK) { final int i = text.lastIndexOf(dow); if (i != -1) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12.6K bytes - Viewed (0) -
fess-crawler/src/test/resources/extractor/test_attr.html
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 308 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java
String ext; if (outputExtension == null) { if (StringUtil.isNotBlank(extention)) { ext = "." + extention; } else { ext = extention; } } else { ext = outputExtension; }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 16K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractorTest.java
ZipExtractor zipExtractor = container.getComponent("zipExtractor"); factory.addExtractor("text/plain", tikaExtractor); factory.addExtractor("text/html", tikaExtractor); factory.addExtractor("application/zip", zipExtractor); })// ;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 3.7K bytes - Viewed (0) -
fess-crawler/src/test/resources/extractor/eml/sample2.eml
and @handle --> <span class="full_name_truncate" style="display:block;font-family:'Helvetica Neue Light', Helvetica, Arial, sans-serif;-webkit-font-smoothing:antialiased;-webkit-text-size-adjust:none;font-size:16px;text-align:left;color:#8899a6;padding:0px;margin:0px;line-height:20px;white-space:nowrap;overflow:hidden;text-overflow:ellipsis;width:289px;"><strong><a href="https://twitter.com/i/redirect?url=https%3A%2F%2Ftwitter.com%2Ftokyo_bousai%3Ft%3D1%26cn%3DZmxleGlibGVfcmVjc18y%26sig%3D469e0de...
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Jan 16 07:50:35 UTC 2016 - 91.6K bytes - Viewed (0) -
fess-crawler/src/test/resources/extractor/test_utf8.html
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 162 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java
import org.codelibs.fess.crawler.exception.ExtractException; /** * Gets a text from .doc file. * * @author shinsuke * */ public class MsWordExtractor extends AbstractExtractor { /** * Creates a new MsWordExtractor instance. */ public MsWordExtractor() { super(); } /** * Extracts text from the Word input stream. * @param in The input stream.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0)