Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 1 - 6 of 6 for ExtractorFactory (0.21 seconds)

  1. src/main/java/org/codelibs/fess/crawler/transformer/FessFileTransformer.java

        @Override
        protected Extractor getExtractor(final ResponseData responseData) {
            final ExtractorFactory extractorFactory = ComponentUtil.getExtractorFactory();
            if (extractorFactory == null) {
                throw new FessSystemException("Could not find extractorFactory.");
            }
            final Extractor extractor = extractorFactory.getExtractor(responseData.getMimeType());
            if (logger.isDebugEnabled()) {
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 3.5K bytes
    - Click Count (0)
  2. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

        @Override
        protected Extractor getExtractor(final ResponseData responseData) {
            final ExtractorFactory extractorFactory = ComponentUtil.getExtractorFactory();
            if (extractorFactory == null) {
                throw new FessSystemException("Could not find extractorFactory.");
            }
            Extractor extractor = extractorFactory.getExtractor(responseData.getMimeType());
            if (extractor == null) {
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 3.8K bytes
    - Click Count (0)
  3. README.md

        filter.addExclude(".*\\.(css|js|png|jpg|gif)$");
    });
    
    // Configure content extraction
    container.singleton("tikaExtractor", TikaExtractor.class);
    container.singleton("extractorFactory", ExtractorFactory.class, factory -> {
        factory.addExtractor("text/html", container.getComponent("tikaExtractor"));
        factory.addExtractor("application/pdf", container.getComponent("tikaExtractor"));
    });
    
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Sun Aug 31 05:32:52 GMT 2025
    - 15.3K bytes
    - Click Count (0)
  4. src/main/java/org/codelibs/fess/util/ComponentUtil.java

    import org.codelibs.fess.crawler.client.CrawlerClientCreator;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.entity.OpenSearchAccessResult;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.service.DataService;
    import org.codelibs.fess.dict.DictionaryManager;
    import org.codelibs.fess.ds.DataStoreFactory;
    import org.codelibs.fess.exception.ContainerNotAvailableException;
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Sat Mar 28 06:59:19 GMT 2026
    - 30.9K bytes
    - Click Count (0)
  5. CLAUDE.md

    ├── fess-crawler-lasta/        # LastaFlute DI integration
    └── fess-crawler-opensearch/   # OpenSearch backend
    ```
    
    ### Key Design Patterns
    
    - **Factory**: `CrawlerClientFactory`, `ExtractorFactory` - protocol/format-specific component selection
    - **Strategy**: `CrawlerClient`, `Extractor`, `Transformer` - pluggable implementations
    - **Builder**: `RequestDataBuilder`, `ExtractorBuilder` - fluent construction
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Mar 12 03:39:20 GMT 2026
    - 8.1K bytes
    - Click Count (0)
  6. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    		<property name="officeManager">
    			@org.jodconverter.local.office.LocalOfficeManager@.builder().portNumbers(12002).build()
    		</property>
    	</component>
    	-->
    
    	<component name="extractorFactory"
    		class="org.codelibs.fess.crawler.extractor.ExtractorFactory">
    		<postConstruct name="addExtractor">
    			<arg>[
    				"application/xml",
    				"application/xhtml+xml",
    				"application/rdf+xml",
    				"application/x-freemind",
    				"text/xml"
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Wed Feb 11 01:15:55 GMT 2026
    - 50.4K bytes
    - Click Count (0)
Back to Top