Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 36 for ExtractData (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

         */
        public TextExtractor() {
            super();
        }
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("The inputstream is null.");
            }
            try {
                return new ExtractData(new String(InputStreamUtil.getBytes(in), getEncoding()));
            } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

     * <pre>
     * {@code
     * try (InputStream in = new FileInputStream("example.pdf")) {
     *     ExtractData extractData = new ExtractorBuilder(crawlerContainer, in, new HashMap<>())
     *         .mimeType("application/pdf")
     *         .filename("example.pdf")
     *         .maxContentLength(1024 * 1024)
     *         .extract();
     *
     *     String content = extractData.getContent();
     *     // Process the extracted content
     * } catch (IOException e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java

                executeCommand(inputFile, outputFile);
    
                final ExtractData extractData = new ExtractData(new String(FileUtil.readBytes(outputFile), outputEncoding));
                if (StringUtil.isNotBlank(resourceName)) {
                    extractData.putValues("resourceName", new String[] { resourceName });
                }
    
                return extractData;
            } catch (final IOException e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 16K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java

         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("The inputstream is null.");
            }
            try {
                @SuppressWarnings("resource")
                final VisioTextExtractor visioTextExtractor = new VisioTextExtractor(in);
                return new ExtractData(visioTextExtractor.getText());
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.CopyUtil;
    import org.codelibs.core.io.FileUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.exception.MaxLengthExceededException;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

                throw new ExtractException(e);
            }
        }
    
        /**
         * Creates an ExtractData object from the extracted content.
         * @param content The extracted content.
         * @return The ExtractData object.
         */
        protected ExtractData createExtractData(final String content) {
            return new ExtractData(extractString(content));
        }
    
        /**
         * Detects the encoding of the input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java

         *
         * @param in the input stream to extract text from
         * @param params a map of parameters to be used during extraction
         * @return an ExtractData object containing the extracted text
         */
        ExtractData getText(InputStream in, Map<String, String> params);
    
        /**
         * Returns the weight of the extractor.
         * The default implementation returns a weight of 1.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.6K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .doc file.
     *
     * @author shinsuke
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java

    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.Map;
    
    import org.apache.poi.hssf.usermodel.HSSFWorkbook;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .xls file.
     *
     * @author shinsuke
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/MimeTypeHelperImpl.java

            final Map<String, String> params = new HashMap<>();
            params.put(ExtractData.RESOURCE_NAME_KEY, filename);
            return getContentType(is, params);
        }
    
        @Override
        public String getContentType(final InputStream is, final Map<String, String> params) {
            final String filename = params.get(ExtractData.RESOURCE_NAME_KEY);
            if (StringUtil.isEmpty(filename) && is == null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
Back to top