Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 6 of 6 for offline (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.jodconverter.core.office.OfficeException;
    import org.jodconverter.core.office.OfficeManager;
    import org.jodconverter.local.LocalConverter;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  2. README.md

    - **FTP**: FTP server crawling with authentication
    - **SMB/CIFS**: Windows network shares
    - **Storage**: Cloud storage systems (MinIO, S3-compatible)
    
    ### Content Formats
    
    #### Office Documents
    - Microsoft Office (Word, Excel, PowerPoint)
    - OpenOffice/LibreOffice documents
    - RTF, WordPerfect
    
    #### PDFs and Images
    - PDF documents (text and metadata extraction)
    - Images (JPEG, PNG, GIF, TIFF, BMP)
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      <mime-type type="application/vnd.ms-excel.addin.macroenabled.12">
        <_comment>Office Open XML Workbook Add-in (macro-enabled)</_comment>
        <glob pattern="*.xlam"/>
        <sub-class-of type="application/x-tika-ooxml"/>
      </mime-type>
    
      <mime-type type="application/vnd.ms-excel.sheet.macroenabled.12">
        <_comment>Office Open XML Workbook (macro-enabled)</_comment>
        <glob pattern="*.xlsm"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java

            assertEquals("こめんと", extractData.getValues("w:Comments")[0]);
            assertEquals("たぐ|さぶたいとる", String.join("|", extractData.getValues("dc:subject")));
            assertEquals("Microsoft Office Word", extractData.getValues("extended-properties:Application")[0]);
            assertEquals("sugaya", extractData.getValues("meta:last-author")[0]);
            assertEquals("太郎", extractData.getValues("dc:creator")[0]);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.6K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/JodExtractorTest.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.dbflute.utflute.core.PlainTestCase;
    import org.jodconverter.local.office.LocalOfficeManager;
    
    /**
     * @author shinsuke
     *
     */
    public class JodExtractorTest extends PlainTestCase {
        private static final Logger logger = LogManager.getLogger(JodExtractorTest.class);
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.5K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    	<!--
    	<component name="jodExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.JodExtractor">
    		<property name="officeManager">
    			@org.jodconverter.local.office.LocalOfficeManager@.builder().portNumbers(12002).build()
    		</property>
    	</component>
    	-->
    
    	<component name="extractorFactory"
    		class="org.codelibs.fess.crawler.extractor.ExtractorFactory">
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
Back to top