Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 6 of 6 for 7zip (0.01 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractorTest.java

                        factory.addExtractor("application/zip", zipExtractor);
    
                    })//
            ;
    
            zipExtractor = container.getComponent("zipExtractor");
        }
    
        public void test_getText() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/zip/test.zip");
            final String content = zipExtractor.getText(in, null).getContent();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

    import org.xml.sax.helpers.DefaultHandler;
    
    /**
     * Helper class for parsing and validating sitemaps.
     * It supports XML sitemaps, XML sitemap indexes, and text sitemaps,
     * and can handle GZIP compressed sitemaps.
     * The class provides methods to check if an input stream is a valid sitemap,
     * and to parse an input stream into a {@link SitemapSet} object.
     * It uses SAX parser for XML sitemaps and XML sitemap indexes,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

    import java.util.HashMap;
    import java.util.Map;
    
    import org.apache.commons.compress.archivers.ArchiveInputStream;
    import org.apache.commons.compress.archivers.ArchiveStreamFactory;
    import org.apache.commons.compress.archivers.zip.ZipArchiveEntry;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java

            assertEquals("かいしゃ", extractData.getValues("dc:publisher")[0]);
        }
    
        public void test_getTika_zip() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/zip/test.zip");
            final ExtractData extractData = tikaExtractor.getText(in, null);
            final String content = extractData.getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.6K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

     *   <li>Reading content as plain text if all other methods fail</li>
     *   <li>Applying post-extraction filters</li>
     *   <li>Handling Tika exceptions, including zip bomb exceptions</li>
     * </ul>
     *
     * <p>
     * The class also supports configuration options such as:
     * </p>
     * <ul>
     *   <li>Output encoding</li>
     *   <li>Maximum compression ratio and uncompression size</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  6. README.md

    - RTF, WordPerfect
    
    #### PDFs and Images
    - PDF documents (text and metadata extraction)
    - Images (JPEG, PNG, GIF, TIFF, BMP)
    - Image metadata (EXIF, IPTC, XMP)
    
    #### Archives and Compressed Files
    - ZIP, TAR, GZ archives
    - LHA compression format
    - Nested archive extraction
    
    #### Web and Markup
    - HTML, XHTML with XPath support
    - XML documents
    - JSON and structured data
    
    #### Media Files
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
Back to top