Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 10 for Extractor (0.1 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ExtractData;
    
    /**
     * @author shinsuke
     *
     */
    public interface Extractor {
    
        ExtractData getText(InputStream in, Map<String, String> params);
    
        default int getWeight() {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Tue Jun 18 05:49:13 UTC 2024
    - 960 bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java

        protected Map<String, Extractor> extractorMap = new HashMap<>();
    
        public void addExtractor(final String key, final Extractor extractor) {
            if (StringUtil.isBlank(key)) {
                throw new CrawlerSystemException("The key is null.");
            }
            if (extractor == null) {
                throw new CrawlerSystemException("The extractor is null.");
            }
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Tue Jun 18 05:49:57 UTC 2024
    - 2.9K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

                dfos = out;
                CopyUtil.copy(in, out);
                out.flush();
    
                Extractor extractor = StringUtil.isBlank(mimeType) ? null : extractorFactory.getExtractor(mimeType);
                if (extractor == null) {
                    final String detectedMimeType = getMimeType(out);
                    extractor = extractorFactory.getExtractor(detectedMimeType);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:40:57 UTC 2024
    - 6.3K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.impl.TikaExtractor;
    import org.codelibs.fess.crawler.transformer.impl.AbstractTransformer;
    import org.codelibs.fess.crawler.util.CrawlingParameterUtil;
    import org.codelibs.fess.crawler.util.FieldConfigs;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:11:58 UTC 2024
    - 23.6K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/ExtractorFactoryTest.java

            final Extractor extractor = new Extractor() {
                public ExtractData getText(final InputStream in, final Map<String, String> params) {
                    return null;
                }
            };
    
            assertNull(extractorFactory.getExtractor("test"));
            extractorFactory.addExtractor("test", extractor);
            assertEquals(extractor, extractorFactory.getExtractor("test"));
        }
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Tue Jun 18 05:49:13 UTC 2024
    - 6.5K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
        <include path="crawler/sitemaps.xml"/>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import org.apache.commons.lang3.SystemUtils;
    import org.apache.tika.config.TikaConfig;
    import org.apache.tika.detect.Detector;
    import org.apache.tika.exception.TikaException;
    import org.apache.tika.extractor.EmbeddedDocumentExtractor;
    import org.apache.tika.extractor.ParsingEmbeddedDocumentExtractor;
    import org.apache.tika.io.TemporaryResources;
    import org.apache.tika.io.TikaInputStream;
    import org.apache.tika.metadata.Metadata;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:41:37 UTC 2024
    - 25K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/util/ComponentUtil.java

    import org.codelibs.fess.crawler.client.CrawlerClientCreator;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.entity.EsAccessResult;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.service.DataService;
    import org.codelibs.fess.dict.DictionaryManager;
    import org.codelibs.fess.ds.DataStoreFactory;
    import org.codelibs.fess.es.client.SearchEngineClient;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Mon Jun 17 13:35:51 UTC 2024
    - 20.2K bytes
    - Viewed (0)
  9. .github/CODEOWNERS

    platforms/enterprise/enterprise-operations/             @gradle/bt-build-scan
    platforms/enterprise/enterprise-plugin-performance/     @gradle/bt-build-scan
    
    # JVM platform
    build-logic/java-api-extractor              @gradle/bt-jvm
    platforms/jvm/                              @gradle/bt-jvm
    subprojects/plugins/                        @gradle/bt-jvm
    
    # JVM testing services also shared by GE testing plugins
    Registered: Wed Nov 06 11:36:14 UTC 2024
    - Last Modified: Thu Oct 24 14:46:27 UTC 2024
    - 10.6K bytes
    - Viewed (0)
  10. impl/maven-core/plugin-manager.txt

    h3. Plugins
    
    * Execution model
    * Metadata model
    * Metadata tooling
     ** Metadata extractor
     ** Metadata reader
     ** Metadata writer
     ** Metadata adapter (if required for the target system)
    * Maven packaging and lifecycle
    * Maven test harness for plugin execution model
    * Eclipse IDE tooling for plugin execution model and metadata model
    
    - we also seem to have information like the plugin lifecycle model that's buried inside the maven execution model
    Registered: Sun Nov 03 03:35:11 UTC 2024
    - Last Modified: Fri Oct 25 12:31:46 UTC 2024
    - 12.9K bytes
    - Viewed (0)
Back to top