Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 51 for getExt (0.14 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractorTest.java

            final Map<String, String> params = new HashMap<String, String>();
            //final ExtractData text = extractor.getText(new ByteArrayInputStream(FileUtils.readFileToByteArray(new File(filePath))), params);
            final ExtractData text = extractor.getText(new ByteArrayInputStream(testStr.getBytes()), params);
            assertEquals(content, text.getContent());
        }
    
        // TODO other tests
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

            extensionMap.put(inExt, outExt);
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.Extractor#getText(java.io.InputStream,
         * java.util.Map)
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("in is null.");
            }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractorTest.java

            final String content = pdfExtractorForPdfPassword.getText(in, params).getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
            assertTrue(content.contains("テスト"));
        }
    
        public void test_getText_null() {
            try {
                pdfExtractor.getText(null, null);
                fail();
            } catch (final CrawlerSystemException e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 7.6K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java

         * @param params The parameters, expected to contain ExtractData.RESOURCE_NAME_KEY.
         * @return An ExtractData object containing the filename as content.
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("The inputstream is null.");
            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

                logger.debug("supportedTypes: {}", parser.getSupportedTypes(new ParseContext()));
            }
        }
    
        @Override
        public ExtractData getText(final InputStream inputStream, final Map<String, String> params) {
            return getText(inputStream, params, null);
        }
    
        /**
         * Returns an extracted text.
         *
         * @param inputStream An input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java

         *
         * @param in the input stream to extract text from
         * @param params a map of parameters to be used during extraction
         * @return an ExtractData object containing the extracted text
         */
        ExtractData getText(InputStream in, Map<String, String> params);
    
        /**
         * Returns the weight of the extractor.
         * The default implementation returns a weight of 1.
         *
         * @return the weight of the extractor
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.6K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

         */
        public EmlExtractor() {
            // Default constructor
        }
    
        /* (non-Javadoc)
         * @see org.codelibs.fess.crawler.extractor.Extractor#getText(java.io.InputStream, java.util.Map)
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            final Properties props = new Properties(mailProperties);
            if (params != null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java

         */
        public CommandExtractor() {
            // NOP
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.Extractor#getText(java.io.InputStream,
         * java.util.Map)
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            final String resourceName = params == null ? null : params.get(ExtractData.RESOURCE_NAME_KEY);
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 16K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

                        }
                    });
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.Extractor#getText(java.io.InputStream,
         * java.util.Map)
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("The inputstream is null.");
            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

            params.put(ExtractData.CONTENT_TYPE, responseData.getMimeType());
            String content = null;
            try (final InputStream in = responseData.getResponseBody()) {
                content = extractor.getText(in, params).getContent();
            } catch (final Exception e) {
                throw new CrawlingAccessException("Could not extract data.", e);
            }
    
            final ResultData resultData = new ResultData();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
Back to top