- Sort Score
- Result 10 results
- Languages All
Results 1 - 8 of 8 for Doc (0.01 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java
private final Node doc; public DefaultNamespaceContext(final Node doc) { this.doc = doc; } @Override public String getNamespaceURI(final String prefix) { return getNamespaceForPrefix(prefix, doc); }Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 23.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java
final PDDocument doc = document; final Set<Exception> exceptionSet = new HashSet<>(); final Thread task = new Thread(() -> { try { stripper.writeText(doc, writer); extractEmbeddedDocuments(doc, writer); extractAnnotations(doc, writer); } catch (final Exception e) {Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java
import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Gets a text from .doc file. * * @author shinsuke * */ public class MsWordExtractor extends AbstractExtractor { /** * Creates a new MsWordExtractor instance. */ public MsWordExtractor() {Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/suggest/index/SuggestIndexer.java
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Thu Aug 07 02:41:28 UTC 2025 - 34.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java
* Returns the result data header. * @return The result data header. */ protected String getResultDataHeader() { // TODO: Support other XML header types return "<?xml version=\"1.0\"?>\n<doc>\n"; } /** * Returns the result data body for a single value. * @param name The name of the field. * @param value The value of the field. * @return The result data body. */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 13.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java
// public ResponseData call() throws Exception { // String[] urls = // new String[] { // "http://.../", // "http://.../test.pdf", // "http://.../test.doc", // "http://.../test.xls", // "http://.../test.ppt", // "http://.../test.txt", }; // for (String url : urls) { // ResponseData responseData = httpClient.doGet(url);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 11.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java
// Text Formats extensionMap.put("odt", "txt"); extensionMap.put("ott", "txt"); extensionMap.put("sxw", "txt"); extensionMap.put("rtf", "txt"); extensionMap.put("doc", "txt"); extensionMap.put("docx", "txt"); extensionMap.put("wpd", "txt"); extensionMap.put("txt", "txt"); extensionMap.put("html", "txt"); // Spreadsheet FormatsRegistered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java
logger.info(content); assertTrue(content.contains("ใในใ")); } public void test_getTika_msword() { final InputStream in = ResourceUtil.getResourceAsStream("extractor/msoffice/test.doc"); final ExtractData extractData = tikaExtractor.getText(in, null); final String content = extractData.getContent(); CloseableUtil.closeQuietly(in); logger.info(content);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.6K bytes - Viewed (0)