- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 20 for docx (0.01 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformerTest.java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 12.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java
private final Node doc; public DefaultNamespaceContext(final Node doc) { this.doc = doc; } @Override public String getNamespaceURI(final String prefix) { return getNamespaceForPrefix(prefix, doc); }Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 23.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformerTest.java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 13.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java
final PDDocument doc = document; final Set<Exception> exceptionSet = new HashSet<>(); final Thread task = new Thread(() -> { try { stripper.writeText(doc, writer); extractEmbeddedDocuments(doc, writer); extractAnnotations(doc, writer); } catch (final Exception e) {Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java
import org.codelibs.fess.crawler.exception.RobotsTxtException; /** * Robots.txt Specifications: * <ul> * <li><a href= * "https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt" * >https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt * </a></li> * </ul> * * @author bowez * @author shinsuke * */ public class RobotsTxtHelper { /** Pattern for parsing user-agent records. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 7.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java
import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Gets a text from .doc file. * * @author shinsuke * */ public class MsWordExtractor extends AbstractExtractor { /** * Creates a new MsWordExtractor instance. */ public MsWordExtractor() {Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractorTest.java
msWordExtractor = container.getComponent("msWordExtractor"); } public void test_getText() { final InputStream in = ResourceUtil.getResourceAsStream("extractor/msoffice/test.doc"); final String content = msWordExtractor.getText(in, null).getContent(); CloseableUtil.closeQuietly(in); logger.info(content); assertTrue(content.contains("テスト")); }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java
* Returns the result data header. * @return The result data header. */ protected String getResultDataHeader() { // TODO: Support other XML header types return "<?xml version=\"1.0\"?>\n<doc>\n"; } /** * Returns the result data body for a single value. * @param name The name of the field. * @param value The value of the field. * @return The result data body. */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 13.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java
// public ResponseData call() throws Exception { // String[] urls = // new String[] { // "http://.../", // "http://.../test.pdf", // "http://.../test.doc", // "http://.../test.xls", // "http://.../test.ppt", // "http://.../test.txt", }; // for (String url : urls) { // ResponseData responseData = httpClient.doGet(url);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 11.7K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler/extractor.xml
"application/vnd.sbm.cid", "application/vnd.sbm.mid2", "application/vnd.scribus", "application/vnd.sealed.3df", "application/vnd.sealed.csf", "application/vnd.sealed.doc", "application/vnd.sealed.eml", "application/vnd.sealed.mht", "application/vnd.sealed.net", "application/vnd.sealed.ppt", "application/vnd.sealed.tiff", "application/vnd.sealed.xls",
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Aug 01 21:40:30 UTC 2020 - 49K bytes - Viewed (0)