Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 31 for words (0.02 sec)

  1. src/main/java/org/codelibs/fess/suggest/entity/ElevateWord.java

         */
        protected final List<String> readings;
    
        /**
         * The list of fields associated with the elevate word.
         */
        protected final List<String> fields;
    
        /**
         * The list of tags associated with the elevate word.
         */
        protected final List<String> tags;
    
        /**
         * The list of roles associated with the elevate word.
         */
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 4K bytes
    - Viewed (0)
  2. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/vnd.ms-wmdrm.lic-resp",
    				"application/vnd.ms-wmdrm.meter-chlg-req",
    				"application/vnd.ms-wmdrm.meter-resp",
    				"application/vnd.ms-word.document.macroenabled.12",
    				"application/vnd.ms-word.template.macroenabled.12",
    				"application/vnd.ms-works",
    				"application/vnd.ms-wpl",
    				"application/vnd.ms-xpsdocument",
    				"application/vnd.mseq",
    				"application/vnd.msign",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  3. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        <alias type="application/vnd.ms-word"/>
        <_comment>Microsoft Word Document</_comment>
        <tika:link>http://en.wikipedia.org/wiki/.doc</tika:link>
        <tika:uti>com.microsoft.word.doc</tika:uti>
        <magic priority="50">
          <match value="Microsoft\ Word\ 6.0\ Document" type="string" offset="2080"/>
          <match value="Documento\ Microsoft\ Word\ 6" type="string" offset="2080"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

    public class MsWordExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsWordExtractor instance.
         */
        public MsWordExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Word input stream.
         * @param in The input stream.
         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  5. README.md

    - **FTP**: FTP server crawling with authentication
    - **SMB/CIFS**: Windows network shares
    - **Storage**: Cloud storage systems (MinIO, S3-compatible)
    
    ### Content Formats
    
    #### Office Documents
    - Microsoft Office (Word, Excel, PowerPoint)
    - OpenOffice/LibreOffice documents
    - RTF, WordPerfect
    
    #### PDFs and Images
    - PDF documents (text and metadata extraction)
    - Images (JPEG, PNG, GIF, TIFF, BMP)
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/suggest/settings/SuggestSettings.java

     *
     * <p>This class provides methods to initialize settings, get and set individual settings,
     * and manage various types of settings such as array settings, analyzer settings, bad word settings,
     * and elevate word settings.</p>
     *
     * <p>It also includes a nested TimeoutSettings class to manage various timeout configurations.</p>
     *
     * <p>Usage example:</p>
     * <pre>
     * {@code
     * Client client = ...;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 18.7K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java

            assertEquals("こめんと", extractData.getValues("w:Comments")[0]);
            assertEquals("たぐ|さぶたいとる", String.join("|", extractData.getValues("dc:subject")));
            assertEquals("Microsoft Office Word", extractData.getValues("extended-properties:Application")[0]);
            assertEquals("sugaya", extractData.getValues("meta:last-author")[0]);
            assertEquals("太郎", extractData.getValues("dc:creator")[0]);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.6K bytes
    - Viewed (0)
  8. src/test/java/org/codelibs/fess/suggest/converter/ReadingConverterTest.java

            // Test convert with long text
            converter.init();
            StringBuilder sb = new StringBuilder();
            for (int i = 0; i < 1000; i++) {
                sb.append("word").append(i).append(" ");
            }
            String text = sb.toString();
            String field = "content";
    
            List<String> readings = converter.convert(text, field, "en");
    
            assertNotNull(readings);
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 13.5K bytes
    - Viewed (0)
  9. src/test/java/org/codelibs/fess/suggest/util/SuggestUtilTest.java

            // Test empty query
            String[] emptyKeywords = SuggestUtil.parseQuery("", field);
            assertNotNull(emptyKeywords);
            assertEquals(0, emptyKeywords.length);
    
            // Test single word query
            String[] singleKeyword = SuggestUtil.parseQuery("single", field);
            assertNotNull(singleKeyword);
            assertEquals(1, singleKeyword.length);
            assertEquals("single", singleKeyword[0]);
        }
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 18.2K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractorTest.java

            pdfExtractor = container.getComponent("pdfExtractor");
            pdfExtractorForPdfPassword = container.getComponent("pdfExtractorForPdfPassword");
            pdfExtractorForPdfPassword.addPassword(".*test_.*.pdf", "word");
        }
    
        public void test_getText() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/test.pdf");
            final ExtractData extractData = pdfExtractor.getText(in, null);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 7.6K bytes
    - Viewed (0)
Back to top