Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 9 of 9 for compressor (0.03 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    
    import org.apache.commons.compress.archivers.ArchiveStreamFactory;
    import org.apache.commons.compress.compressors.CompressorStreamFactory;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TarExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    
    import org.apache.commons.compress.archivers.ArchiveStreamFactory;
    import org.apache.commons.compress.compressors.CompressorStreamFactory;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  3. README.md

    - RTF, WordPerfect
    
    #### PDFs and Images
    - PDF documents (text and metadata extraction)
    - Images (JPEG, PNG, GIF, TIFF, BMP)
    - Image metadata (EXIF, IPTC, XMP)
    
    #### Archives and Compressed Files
    - ZIP, TAR, GZ archives
    - LHA compression format
    - Nested archive extraction
    
    #### Web and Markup
    - HTML, XHTML with XPath support
    - XML documents
    - JSON and structured data
    
    #### Media Files
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

    import java.io.BufferedInputStream;
    import java.io.InputStream;
    import java.util.HashMap;
    import java.util.Map;
    
    import org.apache.commons.compress.archivers.ArchiveInputStream;
    import org.apache.commons.compress.archivers.ArchiveStreamFactory;
    import org.apache.commons.compress.archivers.zip.ZipArchiveEntry;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        <_comment>ZLIB Compressed Data Format</_comment>
        <tika:link>http://tools.ietf.org/html/rfc1950</tika:link>
        <magic priority="45">
          <!-- Low/No compression -->
          <match value="\x78\x01" type="string" offset="0" />
          <!-- Medium compression -->
          <match value="\x78\x5e" type="string" offset="0" />
          <!-- Default compression -->
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java

    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    import java.util.HashMap;
    import java.util.Map;
    
    import org.apache.commons.compress.archivers.ArchiveInputStream;
    import org.apache.commons.compress.archivers.ArchiveStreamFactory;
    import org.apache.commons.compress.archivers.tar.TarArchiveEntry;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5K bytes
    - Viewed (0)
  7. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/vnd.motorola.flexsuite.wem",
    				"application/vnd.motorola.iprm",
    				"application/vnd.mozilla.xul+xml",
    				"application/vnd.ms-artgalry",
    				"application/vnd.ms-asf",
    				"application/vnd.ms-cab-compressed",
    				"application/vnd.ms-excel",
    				"application/vnd.ms-excel.addin.macroenabled.12",
    				"application/vnd.ms-excel.sheet.macroenabled.12",
    				"application/vnd.ms-excel.sheet.binary.macroenabled.12",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

    import org.xml.sax.helpers.DefaultHandler;
    
    /**
     * Helper class for parsing and validating sitemaps.
     * It supports XML sitemaps, XML sitemap indexes, and text sitemaps,
     * and can handle GZIP compressed sitemaps.
     * The class provides methods to check if an input stream is a valid sitemap,
     * and to parse an input stream into a {@link SitemapSet} object.
     * It uses SAX parser for XML sitemaps and XML sitemap indexes,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

         */
        public void setReadAsTextIfFailed(final boolean readAsTextIfFailed) {
            this.readAsTextIfFailed = readAsTextIfFailed;
        }
    
        /**
         * Sets the maximum compression ratio.
         * @param maxCompressionRatio The max compression ratio.
         */
        public void setMaxCompressionRatio(final long maxCompressionRatio) {
            this.maxCompressionRatio = maxCompressionRatio;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
Back to top