Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 10 for Archive (0.11 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

        /**
         * Creates a new LhaExtractor instance.
         */
        public LhaExtractor() {
            super();
        }
    
        /**
         * Extracts text content from an LHA archive input stream.
         *
         * @param in the input stream containing the LHA archive
         * @param params extraction parameters
         * @return the extracted text data
         * @throws CrawlerSystemException if the input stream is null
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  2. fess-crawler-lasta/pom.xml

    			</plugin>
    			<plugin>
    				<artifactId>maven-jar-plugin</artifactId>
    				<configuration>
    					<archive>
    						<manifestEntries>
    							<Automatic-Module-Name>org.codelibs.fess.crawler.lasta</Automatic-Module-Name>
    						</manifestEntries>
    					</archive>
    				</configuration>
    			</plugin>
    			<plugin>
    				<groupId>com.mycila</groupId>
    				<artifactId>license-maven-plugin</artifactId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 2.9K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/pom.xml

    			</plugin>
    			<plugin>
    				<artifactId>maven-jar-plugin</artifactId>
    				<configuration>
    					<archive>
    						<manifestEntries>
    							<Automatic-Module-Name>org.codelibs.fess.crawler.opensearch</Automatic-Module-Name>
    						</manifestEntries>
    					</archive>
    				</configuration>
    			</plugin>
    			<plugin>
    				<groupId>com.mycila</groupId>
    				<artifactId>license-maven-plugin</artifactId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  4. pom.xml

    			</plugin>
    			<plugin>
    				<artifactId>maven-jar-plugin</artifactId>
    				<configuration>
    					<archive>
    						<manifestEntries>
    							<Automatic-Module-Name>org.codelibs.fess.suggest</Automatic-Module-Name>
    						</manifestEntries>
    					</archive>
    				</configuration>
    			</plugin>
    			<plugin>
    				<groupId>com.mycila</groupId>
    				<artifactId>license-maven-plugin</artifactId>
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Sep 06 03:14:57 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  5. fess-crawler/pom.xml

    			</plugin>
    			<plugin>
    				<artifactId>maven-jar-plugin</artifactId>
    				<configuration>
    					<archive>
    						<manifestEntries>
    							<Automatic-Module-Name>org.codelibs.fess.crawler</Automatic-Module-Name>
    						</manifestEntries>
    					</archive>
    				</configuration>
    			</plugin>
    			<plugin>
    				<groupId>com.mycila</groupId>
    				<artifactId>license-maven-plugin</artifactId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

    import jakarta.annotation.Resource;
    
    /**
     * Extracts text content from ZIP archives.
     */
    public class ZipExtractor extends AbstractExtractor {
        private static final Logger logger = LogManager.getLogger(ZipExtractor.class);
    
        /**
         * The archive stream factory.
         */
        @Resource
        protected ArchiveStreamFactory archiveStreamFactory;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java

    import jakarta.annotation.Resource;
    
    /**
     * Extracts text content from TAR archives.
     */
    public class TarExtractor extends AbstractExtractor {
        private static final Logger logger = LogManager.getLogger(TarExtractor.class);
    
        /**
         * The archive stream factory.
         */
        @Resource
        protected ArchiveStreamFactory archiveStreamFactory;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5K bytes
    - Viewed (0)
  8. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      <mime-type type="application/java-archive">
        <_comment>Java Archive</_comment>
        <tika:link>http://en.wikipedia.org/wiki/.jar</tika:link>
        <tika:uti>com.sun.java-archive</tika:uti>
        <sub-class-of type="application/zip"/>
        <glob pattern="*.jar"/>
      </mime-type>
    
      <mime-type type="application/vnd.android.package-archive">
        <sub-class-of type="application/java-archive"/>
        <glob pattern="*.apk"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  9. README.md

    #### PDFs and Images
    - PDF documents (text and metadata extraction)
    - Images (JPEG, PNG, GIF, TIFF, BMP)
    - Image metadata (EXIF, IPTC, XMP)
    
    #### Archives and Compressed Files
    - ZIP, TAR, GZ archives
    - LHA compression format
    - Nested archive extraction
    
    #### Web and Markup
    - HTML, XHTML with XPath support
    - XML documents
    - JSON and structured data
    
    #### Media Files
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * <li>yearly</li>
         * <li>never</li>
         * </ul>
         * The value "always" should be used to describe documents that change each
         * time they are accessed. The value "never" should be used to describe
         * archived URLs.
         *
         * Please note that the value of this tag is considered a hint and not a
         * command. Even though search engine crawlers may consider this information
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
Back to top