Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 51 - 60 of 103 for etext (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

     * The {@link TikaExtractor} class is responsible for extracting text content and metadata from various file formats
     * using the Apache Tika library. It extends {@link PasswordBasedExtractor} to handle password-protected files.
     * </p>
     *
     * <p>
     * This class provides methods to extract text from an input stream, handling different scenarios such as:
     * </p>
     * <ul>
     *   <li>Normalizing text content</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  2. fess-crawler/src/test/resources/extractor/test.mm

    <map version="0.7.1">
    <node TEXT="&#12479;&#12452;&#12488;&#12523;">
    <node TEXT="&#12486;&#12473;&#12488;" MODIFIED="1237874353965" STYLE="fork"/>
    </node>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 162 bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/service/impl/DataServiceImplTest.java

            assertNotNull(accessResult2);
    
            accessResult2.setMimeType("text/html");
            dataService.update(accessResult2);
    
            final AccessResult accessResult3 = dataService.getAccessResult("id1", "http://www.id1.com/");
            assertNotNull(accessResult3);
            assertEquals("text/html", accessResult3.getMimeType());
    
            dataService.delete("id1");
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/suggest/util/SuggestUtil.java

                return keywords;
            }
            for (final TermQuery tq : termQueryList) {
                final String text = tq.getTerm().text();
                if (0 == text.length() || keywords.contains(text)) {
                    continue;
                }
                keywords.add(text);
            }
            return keywords;
        }
    
        /**
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 17.4K bytes
    - Viewed (1)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.jodconverter.core.office.OfficeManager;
    import org.jodconverter.local.LocalConverter;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
     * Extracts text content from various document formats using JODConverter.
     */
    public class JodExtractor extends AbstractExtractor {
        /** Logger for this class. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/fs/FileSystemClientTest.java

            assertNotNull(responseData.getLastModified());
            assertEquals(Constants.GET_METHOD, responseData.getMethod());
            assertEquals("text/plain", responseData.getMimeType());
            assertTrue(responseData.getUrl().endsWith("test/text%203.txt"));
            final String content = new String(InputStreamUtil.getBytes(responseData.getResponseBody()), "UTF-8");
            assertEquals("test3\n", content);
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 8K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java

            return new ExtractData(getTextInternal(in, mimeTypeHelper, extractorFactory));
        }
    
        /**
         * Returns the text extracted from the input stream.
         *
         * @param in The input stream.
         * @param mimeTypeHelper The mime type helper.
         * @param extractorFactory The extractor factory.
         * @return The extracted text.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/RuleTest.java

            rule.addCondition("mimeType", "text/.*");
    
            ResponseData responseData1 = new ResponseData();
            responseData1.setMimeType("text/html");
            assertTrue(rule.match(responseData1));
    
            ResponseData responseData2 = new ResponseData();
            responseData2.setMimeType("text/plain");
            assertTrue(rule.match(responseData2));
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 22.7K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/suggest/constants/SuggestConstants.java

        public static final String USER_DICT_ENCODING = "fess.user.dict.encoding";
    
        /** The system property name for user dictionary path. */
        public static final String USER_DICT_PATH = "fess.user.dict.path";
    
        /** The text separator. */
        public static final String TEXT_SEPARATOR = " ";
    
        /** The default role for guest users. */
        public static final String DEFAULT_ROLE = "_guest_";
    
        /** The default document type. */
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 1.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets text from a Microsoft Publisher file.
     *
     * @author shinsuke
     *
     */
    public class MsPublisherExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPublisherExtractor instance.
         */
        public MsPublisherExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Publisher input stream.
         * @param in The input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
Back to top