Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 18 for AbstractExtractor (0.07 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java

     * </p>
     *
     */
    public abstract class AbstractExtractor implements Extractor {
    
        /** The crawler container. */
        @Resource
        protected CrawlerContainer crawlerContainer;
    
        /**
         * Constructs a new AbstractExtractor.
         */
        public AbstractExtractor() {
            // NOP
        }
    
        /**
         * Registers this extractor with the ExtractorFactory.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .doc file.
     *
     * @author shinsuke
     *
     */
    public class MsWordExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsWordExtractor instance.
         */
        public MsWordExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Word input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .xls file.
     *
     * @author shinsuke
     *
     */
    public class MsExcelExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsExcelExtractor instance.
         */
        public MsExcelExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Excel input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts the filename from the parameters.
     */
    public class FilenameExtractor extends AbstractExtractor {
    
        /**
         * Constructs a new FilenameExtractor.
         */
        public FilenameExtractor() {
            // Default constructor
        }
    
        /**
         * Extracts the filename from the parameters.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from . file.
     *
     * @author shinsuke
     *
     */
    public class MsVisioExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsVisioExtractor instance.
         */
        public MsVisioExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Visio input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content from Microsoft PowerPoint documents.
     */
    public class MsPowerPointExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPowerPointExtractor instance.
         */
        public MsPowerPointExtractor() {
            super();
        }
    
        /**
         * Extracts text from the PowerPoint input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content from an input stream as plain text.
     */
    public class TextExtractor extends AbstractExtractor {
    
        /**
         * The encoding for text.
         */
        protected String encoding = Constants.UTF_8;
    
        /**
         * Creates a new TextExtractor instance.
         */
        public TextExtractor() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from . file.
     *
     * @author shinsuke
     *
     */
    public class MsPublisherExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPublisherExtractor instance.
         */
        public MsPublisherExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Publisher input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

     * This extractor can extract text content from files within LHA archives
     * by using appropriate extractors for each contained file type.
     *
     * @author shinsuke
     */
    public class LhaExtractor extends AbstractExtractor {
        /** Logger for this class. */
        private static final Logger logger = LogManager.getLogger(LhaExtractor.class);
    
        /** Maximum content size for extraction. -1 means no limit. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

    import org.codelibs.fess.crawler.util.IgnoreCloseInputStream;
    
    import jakarta.annotation.Resource;
    
    /**
     * Extracts text content from ZIP archives.
     */
    public class ZipExtractor extends AbstractExtractor {
        private static final Logger logger = LogManager.getLogger(ZipExtractor.class);
    
        /**
         * The archive stream factory.
         */
        @Resource
        protected ArchiveStreamFactory archiveStreamFactory;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
Back to top