Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 14 for validateInputStream (0.14 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractorTest.java

            /**
             * Public wrapper that forwards the given stream, unchanged, to
             * {@code validateInputStream(in)}.
             *
             * @param in the stream to hand to the validation call; passed through as-is
             */
            public void testValidateInputStream(final InputStream in) {
                validateInputStream(in);
            }
        }
    
        private TestExtractor extractor;
    
        /**
         * Runs the inherited set-up first, then creates a fresh
         * {@code TestExtractor} and stores it in the {@code extractor} field.
         *
         * @throws Exception propagated from the inherited set-up
         */
        @Override
        protected void setUp() throws Exception {
            super.setUp();
            this.extractor = new TestExtractor();
        }
    
        /**
         * Test that validateInputStream accepts non-null input streams.
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 8.4K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/EXTRACTOR_TESTS_README.md

    **Key Test Areas**:
    - Resource closure on successful extraction (MS Office extractors)
    - Resource closure on failed extraction
    - Improved error messages with context
    - Input validation using `validateInputStream()`
    
    **Covered Extractors**:
    - MsWordExtractor
    - MsExcelExtractor
    - MsPowerPointExtractor
    - TextExtractor
    
    **Test Count**: 8 tests
    
    **Key Scenarios**:
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Wed Nov 19 08:55:01 UTC 2025
    - 5.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java

         * @throws ExtractException if an unexpected error occurs during extraction
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
            try {
                final String content = params != null ? params.getOrDefault(ExtractData.RESOURCE_NAME_KEY, StringUtil.EMPTY) : StringUtil.EMPTY;
                return new ExtractData(content);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Wed Nov 19 08:55:01 UTC 2025
    - 2.7K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java

         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
            try (final HSLFSlideShow slideShow = new HSLFSlideShow(in);
                    final SlideShowExtractor<HSLFShape, HSLFTextParagraph> extractor = new SlideShowExtractor<>(slideShow)) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 2K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

         */
        public TextExtractor() {
            super();
        }
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
            try {
                final String content = new String(InputStreamUtil.getBytes(in), getEncoding());
                return new ExtractData(content);
            } catch (final Exception e) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java

         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
            try (final HSSFWorkbook workbook = new HSSFWorkbook(in);
                    final org.apache.poi.hssf.extractor.ExcelExtractor excelExtractor =
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
            try (final org.apache.poi.hwpf.extractor.WordExtractor wordExtractor = new org.apache.poi.hwpf.extractor.WordExtractor(in)) {
                return new ExtractData(wordExtractor.getText());
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Wed Nov 19 08:55:01 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

         */
        public ZipExtractor() {
            super();
        }
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
    
            final MimeTypeHelper mimeTypeHelper = getMimeTypeHelper();
            final ExtractorFactory extractorFactory = getExtractorFactory();
            final StringBuilder buf = new StringBuilder(1000);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 4.8K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java

         */
        public TarExtractor() {
            super();
        }
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            validateInputStream(in);
    
            final MimeTypeHelper mimeTypeHelper = getMimeTypeHelper();
            final ExtractorFactory extractorFactory = getExtractorFactory();
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java

         * This is a common validation performed by most extractors.
         *
         * @param in The input stream to validate
         * @throws CrawlerSystemException if the input stream is null
         */
        protected void validateInputStream(final InputStream in) {
            // Guard clause: a non-null stream passes validation with no further work.
            if (in != null) {
                return;
            }
            // Only a null stream reaches this point.
            throw new CrawlerSystemException("The inputstream is null.");
        }
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Wed Nov 19 08:55:01 UTC 2025
    - 4.6K bytes
    - Viewed (0)
Back to top