Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 4 of 4 for docx (0.01 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/JodExtractorTest.java

        }
    
        public void test_getText_mswordx() {
            InputStream in = ResourceUtil.getResourceAsStream("extractor/msoffice/test.docx");
            Map<String, String> params = new HashMap<String, String>();
            params.put("resourceName", "test.docx");
            ExtractData extractData = jodExtractor.getText(in, params);
            String content = extractData.getContent();
            CloseableUtil.closeQuietly(in);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import org.codelibs.fess.crawler.exception.RobotsTxtException;
    
    /**
     * Robots.txt Specifications:
     * <ul>
     * <li><a href=
     * "https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt"
     * >https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt
     * </a></li>
     * </ul>
     *
     * @author bowez
     * @author shinsuke
     *
     */
    public class RobotsTxtHelper {
    
        /** Pattern for parsing user-agent records. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .doc file.
     *
     * @author shinsuke
     *
     */
    public class MsWordExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsWordExtractor instance.
         */
        public MsWordExtractor() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractorTest.java

            msWordExtractor = container.getComponent("msWordExtractor");
        }
    
        public void test_getText() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/msoffice/test.doc");
            final String content = msWordExtractor.getText(in, null).getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
            assertTrue(content.contains("テスト"));
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.1K bytes
    - Viewed (0)
Back to top