Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 20 for docx (0.01 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformerTest.java

            final String value = "<?xml version=\"1.0\"?>\n"//
                    + "<doc>\n"//
                    + "<field name=\"title\">タイトル</field>\n"//
                    + "<field name=\"body\">第一章 第一節 ほげほげふがふが LINK 第2章 第2節</field>\n"//
                    + "<field name=\"list\"><list><item>リスト1</item><item>リスト2</item><item>リスト3</item></list></field>\n"//
                    + "</doc>";
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java

            private final Node doc;
    
            /**
             * Creates a namespace context bound to the given node.
             *
             * @param doc the node stored by this context; it is handed to
             *            {@code getNamespaceForPrefix} whenever
             *            {@link #getNamespaceURI(String)} is called
             */
            public DefaultNamespaceContext(final Node doc) {
                this.doc = doc;
            }
    
            /**
             * Looks up the namespace URI for a prefix.
             *
             * @param prefix the namespace prefix to look up
             * @return whatever {@code getNamespaceForPrefix} yields for the prefix
             *         and the node held by this context
             */
            @Override
            public String getNamespaceURI(final String prefix) {
                // Delegate the lookup, using the node captured at construction time.
                final String namespaceUri = getNamespaceForPrefix(prefix, doc);
                return namespaceUri;
            }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 23.9K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformerTest.java

            final String value = "<?xml version=\"1.0\"?>\n"//
                    + "<doc>\n"//
                    + "<field name=\"title\">タイトル</field>\n"//
                    + "<field name=\"body\">第一章 第一節 ほげほげふがふが LINK 第2章 第2節</field>\n"//
                    + "<field name=\"list\"><list><item>リスト1</item><item>リスト2</item><item>リスト3</item></list></field>\n"//
                    + "</doc>";
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

                final PDDocument doc = document;
                final Set<Exception> exceptionSet = new HashSet<>();
                final Thread task = new Thread(() -> {
                    try {
                        stripper.writeText(doc, writer);
                        extractEmbeddedDocuments(doc, writer);
                        extractAnnotations(doc, writer);
                    } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import org.codelibs.fess.crawler.exception.RobotsTxtException;
    
    /**
     * Robots.txt Specifications:
     * <ul>
     * <li><a href=
     * "https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt"
     * >https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt
     * </a></li>
     * </ul>
     *
     * @author bowez
     * @author shinsuke
     *
     */
    public class RobotsTxtHelper {
    
        /** Pattern for parsing user-agent records. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text from a .doc file.
     *
     * @author shinsuke
     *
     */
    public class MsWordExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsWordExtractor instance.
         */
        public MsWordExtractor() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractorTest.java

            msWordExtractor = container.getComponent("msWordExtractor");
        }
    
        /**
         * Checks that the text extracted from the sample
         * {@code extractor/msoffice/test.doc} resource contains the expected word.
         */
        public void test_getText() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/msoffice/test.doc");
            final String content;
            try {
                content = msWordExtractor.getText(in, null).getContent();
            } finally {
                // Close in finally so the stream is released even when extraction throws.
                CloseableUtil.closeQuietly(in);
            }
            logger.info(content);
            assertTrue(content.contains("テスト"));
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

         * Returns the result data header.
         * @return The result data header.
         */
        protected String getResultDataHeader() {
            // TODO: Support other XML header types
            // XML declaration followed by the opening <doc> tag, each on its own line.
            final String header = "<?xml version=\"1.0\"?>\n<doc>\n";
            return header;
        }
    
        /**
         * Returns the result data body for a single value.
         * @param name The name of the field.
         * @param value The value of the field.
         * @return The result data body.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

        // public ResponseData call() throws Exception {
        // String[] urls =
        // new String[] {
        // "http://.../",
        // "http://.../test.pdf",
        // "http://.../test.doc",
        // "http://.../test.xls",
        // "http://.../test.ppt",
        // "http://.../test.txt", };
        // for (String url : urls) {
        // ResponseData responseData = httpClient.doGet(url);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  10. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/vnd.sbm.cid",
    				"application/vnd.sbm.mid2",
    				"application/vnd.scribus",
    				"application/vnd.sealed.3df",
    				"application/vnd.sealed.csf",
    				"application/vnd.sealed.doc",
    				"application/vnd.sealed.eml",
    				"application/vnd.sealed.mht",
    				"application/vnd.sealed.net",
    				"application/vnd.sealed.ppt",
    				"application/vnd.sealed.tiff",
    				"application/vnd.sealed.xls",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
Back to top