Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 35 for getContent (0.17 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

                                map.put(ExtractData.RESOURCE_NAME_KEY, filename);
                                buf.append(extractor.getText(new IgnoreCloseInputStream(ais), map).getContent());
                                buf.append('\n');
                            } catch (final Exception e) {
                                if (logger.isDebugEnabled()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java

                                map.put(ExtractData.RESOURCE_NAME_KEY, filename);
                                buf.append(extractor.getText(new IgnoreCloseInputStream(ais), map).getContent());
                                buf.append('\n');
                            } catch (final Exception e) {
                                if (logger.isDebugEnabled()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractorTest.java

        }
    
        public void test_getText() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/lha/test.lzh");
            final String content = lhaExtractor.getText(in, null).getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
            assertTrue(content.contains("テスト"));
            assertTrue(content.contains("テキスト"));
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java

                    } else {
                        String content;
                        try {
                            content = new String(InputStreamUtil.getBytes(entity.getContent()), Constants.UTF_8_CHARSET);
                        } catch (final IOException e) {
                            content = e.getMessage();
                        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (1)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

                try (final FileInputStream in = new FileInputStream(outputFile)) {
                    final ExtractData extractData = extractor.getText(in, params);
                    return extractData.getContent();
                } catch (final IOException e) {
                    throw new ExtractException("Could not open " + outputFile.getAbsolutePath(), e);
                }
            }
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

            params.put(ExtractData.CONTENT_TYPE, responseData.getMimeType());
            String content = null;
            try (final InputStream in = responseData.getResponseBody()) {
                content = extractor.getText(in, params).getContent();
            } catch (final Exception e) {
                throw new CrawlingAccessException("Could not extract data.", e);
            }
    
            final ResultData resultData = new ResultData();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

                        final Map<String, String> map = new HashMap<>();
                        map.put(ExtractData.RESOURCE_NAME_KEY, filename);
                        final String content = extractor.getText(is, map).getContent();
                        writer.write(content);
                        writer.write('\n');
                    } catch (final Exception e) {
                        if (logger.isDebugEnabled()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  8. README.md

        System.out.println("Status: " + accessResult.getHttpStatusCode());
        System.out.println("Content Type: " + accessResult.getMimeType());
        System.out.println("Content: " + accessResult.getContent());
        System.out.println("---");
    });
    
    // Get specific result
    AccessResult result = dataService.getAccessResult(sessionId, url);
    
    // Delete session data
    dataService.delete(sessionId);
    ```
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

     *         .mimeType("application/pdf")
     *         .filename("example.pdf")
     *         .maxContentLength(1024 * 1024)
     *         .extract();
     *
     *     String content = extractData.getContent();
     *     // Process the extracted content
     * } catch (IOException e) {
     *     // Handle exception
     * }
     * }
     * </pre>
     */
    public class ExtractorBuilder {
    
        /** Logger instance for this class */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                            }
                        }
                    }
    
                    if (httpEntity != null) {
                        final RobotsTxt robotsTxt = robotsTxtHelper.parse(httpEntity.getContent());
                        if (robotsTxt != null) {
                            final String[] sitemaps = robotsTxt.getSitemaps();
                            if (sitemaps.length > 0) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
Back to top