- Sort Score
- Result 10 results
- Languages All
Results 51 - 60 of 154 for extracted (3.38 sec)
-
src/main/java/org/codelibs/fess/ldap/LdapManager.java
} consumer.accept(entryDn); } } } } /** * Extracts the role name from an LDAP entry DN. * * @param entryDn the LDAP entry DN * @return the extracted role name, or null if not found */ protected String getSearchRoleName(final String entryDn) { if (entryDn == null) { return null;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 86.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MarkdownExtractor.java
} // Extract links if (extractLinks) { extractLinkMetadata(document, extractData); } return extractData; } catch (final Exception e) { throw new ExtractException("Failed to extract Markdown content", e); } } /** * Extracts YAML front matter metadata from the document. *
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 03:46:53 UTC 2025 - 8.2K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler/extractor.xml
class="org.codelibs.fess.crawler.extractor.impl.MsPowerPointExtractor" /> <component name="msPublisherExtractor" class="org.codelibs.fess.crawler.extractor.impl.MsPublisherExtractor" /> <component name="msVisioExtractor" class="org.codelibs.fess.crawler.extractor.impl.MsVisioExtractor" /> <component name="pdfExtractor" class="org.codelibs.fess.crawler.extractor.impl.PdfExtractor" /> <component name="lhaExtractor"
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 03:46:53 UTC 2025 - 50.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java
} if (extractor == null) { throw new CrawlerSystemException("Extractor instance is null. Cannot register null extractor."); } if (extractorMap.containsKey(key)) { final Extractor[] existingExtractors = extractorMap.get(key);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 7.4K bytes - Viewed (0) -
src/main/resources/crawler/extractor+tikaExtractor.xml
"http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <component name="tikaExtractor" class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor"> <property name="maxCompressionRatio">2</property> <property name="maxUncompressionSize">10000000</property> </component>
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Sun Aug 25 12:46:12 UTC 2019 - 461 bytes - Viewed (0) -
src/main/resources/fess_config.properties
dc:title=title:string\n\ # html # XPath to extract main content from HTML documents. crawler.document.html.content.xpath=//BODY # XPath to extract language attribute from HTML documents. crawler.document.html.lang.xpath=//HTML/@lang # XPath to extract digest (description) from HTML documents. crawler.document.html.digest.xpath=//META[@name='description']/@content # XPath to extract canonical URL from HTML documents.
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Dec 11 09:47:03 UTC 2025 - 54.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import java.util.Map; import org.codelibs.core.io.InputStreamUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.ExtractException; /** * Extracts text content from an input stream as plain text. */
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Dec 11 08:38:29 UTC 2025 - 2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ArchiveExtractorErrorHandlingTest.java
e.getMessage().contains("TAR") || e.getMessage().contains("extract")); } } /** * Test that ZipExtractor successfully extracts from valid archive. */ public void test_ZipExtractor_validArchive_extractsSuccessfully() { final InputStream in = ResourceUtil.getResourceAsStream("extractor/zip/test.zip"); final ExtractData result = zipExtractor.getText(in, null);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 12.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ExtractorResourceManagementTest.java
final AtomicBoolean streamClosed = new AtomicBoolean(false); try (final InputStream originalStream = ResourceUtil.getResourceAsStream("extractor/msoffice/test.xls")) { final InputStream trackableStream = createTrackableInputStream(originalStream, streamClosed); final ExtractData result = extractor.getText(trackableStream, null);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 10.4K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/ExtractorFactoryTest.java
final Extractor extractor = new Extractor() { public ExtractData getText(final InputStream in, final Map<String, String> params) { return null; } }; assertNull(extractorFactory.getExtractor("test")); extractorFactory.addExtractor("test", extractor); assertEquals(extractor, extractorFactory.getExtractor("test")); }
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.9K bytes - Viewed (0)