- Sort Score
- Result 10 results
- Languages All
Results 1 - 9 of 9 for compressor (0.03 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractorTest.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import org.apache.commons.compress.archivers.ArchiveStreamFactory; import org.apache.commons.compress.compressors.CompressorStreamFactory; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.CloseableUtil;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 3.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TarExtractorTest.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import org.apache.commons.compress.archivers.ArchiveStreamFactory; import org.apache.commons.compress.compressors.CompressorStreamFactory; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.CloseableUtil;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 3.7K bytes - Viewed (0) -
README.md
- RTF, WordPerfect #### PDFs and Images - PDF documents (text and metadata extraction) - Images (JPEG, PNG, GIF, TIFF, BMP) - Image metadata (EXIF, IPTC, XMP) #### Archives and Compressed Files - ZIP, TAR, GZ archives - LHA compression format - Nested archive extraction #### Web and Markup - HTML, XHTML with XPath support - XML documents - JSON and structured data #### Media Files
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java
import java.io.BufferedInputStream; import java.io.InputStream; import java.util.HashMap; import java.util.Map; import org.apache.commons.compress.archivers.ArchiveInputStream; import org.apache.commons.compress.archivers.ArchiveStreamFactory; import org.apache.commons.compress.archivers.zip.ZipArchiveEntry; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.5K bytes - Viewed (0) -
fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml
<_comment>ZLIB Compressed Data Format</_comment> <tika:link>http://tools.ietf.org/html/rfc1950</tika:link> <magic priority="45"> <!-- Low/No compression --> <match value="\x78\x01" type="string" offset="0" /> <!-- Medium compression --> <match value="\x78\x5e" type="string" offset="0" /> <!-- Default compression -->
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Mar 13 08:18:01 UTC 2025 - 320.1K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java
package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import java.util.HashMap; import java.util.Map; import org.apache.commons.compress.archivers.ArchiveInputStream; import org.apache.commons.compress.archivers.ArchiveStreamFactory; import org.apache.commons.compress.archivers.tar.TarArchiveEntry; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.CloseableUtil;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler/extractor.xml
"application/vnd.motorola.flexsuite.wem", "application/vnd.motorola.iprm", "application/vnd.mozilla.xul+xml", "application/vnd.ms-artgalry", "application/vnd.ms-asf", "application/vnd.ms-cab-compressed", "application/vnd.ms-excel", "application/vnd.ms-excel.addin.macroenabled.12", "application/vnd.ms-excel.sheet.macroenabled.12", "application/vnd.ms-excel.sheet.binary.macroenabled.12",
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Aug 01 21:40:30 UTC 2020 - 49K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
import org.xml.sax.helpers.DefaultHandler; /** * Helper class for parsing and validating sitemaps. * It supports XML sitemaps, XML sitemap indexes, and text sitemaps, * and can handle GZIP compressed sitemaps. * The class provides methods to check if an input stream is a valid sitemap, * and to parse an input stream into a {@link SitemapSet} object. * It uses SAX parser for XML sitemaps and XML sitemap indexes,
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
*/ public void setReadAsTextIfFailed(final boolean readAsTextIfFailed) { this.readAsTextIfFailed = readAsTextIfFailed; } /** * Sets the maximum compression ratio. * @param maxCompressionRatio The max compression ratio. */ public void setMaxCompressionRatio(final long maxCompressionRatio) { this.maxCompressionRatio = maxCompressionRatio; } /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0)