- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 49 for ExtractData (0.78 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ExtractData.java
protected String content; /** * Constructs a new ExtractData. */ public ExtractData() { // Default constructor } /** * Constructs a new ExtractData with the specified content. * * @param content the content to set */ public ExtractData(final String content) { this.content = content; } /**
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 3.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java
throw exceptionSet.iterator().next(); } writer.flush(); final ExtractData extractData = new ExtractData(writer.toString()); extractMetadata(document, extractData); return extractData; } catch (final Exception e) { throw new ExtractException(e); } } /**
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 12.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java
final ExtractData extractData = tikaExtractor.getText(in, null); final String content = extractData.getContent(); CloseableUtil.closeQuietly(in); logger.info(content); assertTrue(content.contains("テスト")); for (final String key : extractData.getKeySet()) { logger.info("{}={}", key, String.join("|", extractData.getValues(key))); }
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MarkdownExtractorTest.java
final ExtractData extractData = markdownExtractor.getText(in, null); CloseableUtil.closeQuietly(in); // Verify front matter metadata final String[] titles = extractData.getValues("frontmatter.title"); assertNotNull(titles); assertEquals("Sample Markdown Document", titles[0]); final String[] authors = extractData.getValues("frontmatter.author");
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 6.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java
* @param params The parameters map, expected to contain ExtractData.RESOURCE_NAME_KEY * @return An ExtractData object containing the filename as content, or empty string if not found * @throws CrawlerSystemException if the input stream is null * @throws ExtractException if an unexpected error occurs during extraction */ @Override public ExtractData getText(final InputStream in, final Map<String, String> params) {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Wed Nov 19 08:55:01 UTC 2025 - 2.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java
try { final ExtractData extractData = new ExtractData( StreamUtil.stream(getStringsByXPath(document, contentXpath)).get(stream -> stream.collect(Collectors.joining(" ")))); metadataXpathMap.entrySet().stream().forEach(e -> { extractData.putValues(e.getKey(), getStringsByXPath(document, e.getValue())); }); return extractData; } finally {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Oct 04 08:47:19 UTC 2025 - 9.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/ExtractDataTest.java
} public void test_usingPredefinedConstants() { // Test using predefined constants ExtractData data = new ExtractData(); data.putValue(ExtractData.RESOURCE_NAME_KEY, "test.pdf"); data.putValue(ExtractData.URL, "https://example.com/test.pdf"); data.putValues(ExtractData.FILE_PASSWORDS, new String[] { "pass1", "pass2" });
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 9.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/JodExtractorTest.java
Map<String, String> params = new HashMap<String, String>(); params.put("resourceName", "test.odt"); ExtractData extractData = jodExtractor.getText(in, params); String content = extractData.getContent(); CloseableUtil.closeQuietly(in); logger.info(content); assertTrue(content.contains("テスト")); }
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 9.5K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractorTest.java
final ExtractData extractData = pdfExtractor.getText(in, null); final String content = extractData.getContent(); CloseableUtil.closeQuietly(in); logger.info(content); assertTrue(content.contains("テスト")); assertEquals("Writer", extractData.getValues("Creator")[0]); assertEquals("OpenOffice.org 3.0", extractData.getValues("Producer")[0]);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 7.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 25.7K bytes - Viewed (0)