- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 25 for extras (0.14 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java
import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.MimeTypeHelper; import org.codelibs.fess.crawler.util.IgnoreCloseInputStream; import jakarta.annotation.Resource; /** * Extracts text content from ZIP archives. */ public class ZipExtractor extends AbstractExtractor { private static final Logger logger = LogManager.getLogger(ZipExtractor.class); /** * The archive stream factory.Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java
import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.MimeTypeHelper; import org.codelibs.fess.crawler.util.IgnoreCloseInputStream; import jakarta.annotation.Resource; /** * Extracts text content from TAR archives. */ public class TarExtractor extends AbstractExtractor { private static final Logger logger = LogManager.getLogger(TarExtractor.class); /** * The archive stream factory.Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java
import jp.gr.java_conf.dangan.util.lha.LhaFile; import jp.gr.java_conf.dangan.util.lha.LhaHeader; /** * Extractor implementation for LHA (LZH) archive files. * This extractor can extract text content from files within LHA archives * by using appropriate extractors for each contained file type. * * @author shinsuke */ public class LhaExtractor extends AbstractExtractor {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5.8K bytes - Viewed (0) -
src/test/java/org/codelibs/opensearch/extension/ExtensionPlugin.java
extra.put("reloadable_ja_stop", JapaneseStopTokenFilterFactory::new); extra.put("kanji_number", KanjiNumberFilterFactory::new); extra.put("kuromoji_pos_concat", PosConcatenationFilterFactory::new); extra.put("char_type", CharTypeFilterFactory::new); extra.put("number_concat", NumberConcatenationFilterFactory::new);
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Tue Jul 08 14:37:06 UTC 2025 - 5.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java
* optionally override the default weight value. */ public interface Extractor { /** * Extracts text data from the given input stream. * * @param in the input stream to extract text from * @param params a map of parameters to be used during extraction * @return an ExtractData object containing the extracted text */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java
}); return extractData; } finally { xpathAPI.remove(); } } /** * Extracts strings from a document using the specified XPath expression. * * @param document the DOM document to extract strings from * @param path the XPath expression to evaluate * @return an array of strings extracted from the document */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.3K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/suggest/index/contents/ContentsParser.java
ReadingConverter readingConverter, Normalizer normalizer); /** * Parses a document and extracts suggest items based on the provided fields and converters. * * @param document The document to parse, represented as a map of field names to values. * @param fields The fields to extract from the document. * @param tagFieldNames The names of the fields that contain tags.Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Sat Mar 15 06:51:20 UTC 2025 - 4.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java
throw new RobotsTxtException("Failed to parse robots.txt.", e); } } /** * Extracts the value from a line using the given pattern. * @param pattern the pattern to match against * @param line the line to extract the value from * @return the extracted value, or null if no match */ protected String getValue(final Pattern pattern, final String line) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 7.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java
throw new ExtractException(e); } } return encoding; } /** * Extracts text content from the given content by removing tags and processing attributes. * @param content The content to extract from. * @return The extracted text. */ protected String extractString(final String content) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java
import org.codelibs.fess.crawler.exception.ExtractException; /** * Extracts text content from Microsoft PowerPoint documents. */ public class MsPowerPointExtractor extends AbstractExtractor { /** * Creates a new MsPowerPointExtractor instance. */ public MsPowerPointExtractor() { super(); } /** * Extracts text from the PowerPoint input stream. * @param in The input stream.Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.1K bytes - Viewed (0)