Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 13 for ketika (6.58 sec)

  1. fess-crawler/pom.xml

    			<artifactId>tika-parser-html-module</artifactId>
    			<version>${tika.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-parser-image-module</artifactId>
    			<version>${tika.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-parser-mail-module</artifactId>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Dec 20 06:34:36 UTC 2025
    - 12.1K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/MimeTypeHelperImpl.java

    import java.io.BufferedInputStream;
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.HashMap;
    import java.util.Map;
    
    import org.apache.tika.metadata.Metadata;
    import org.apache.tika.mime.MediaType;
    import org.apache.tika.mime.MimeTypes;
    import org.apache.tika.mime.MimeTypesFactory;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 6.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.apache.tika.config.TikaConfig;
    import org.apache.tika.detect.Detector;
    import org.apache.tika.exception.TikaException;
    import org.apache.tika.extractor.EmbeddedDocumentExtractor;
    import org.apache.tika.extractor.ParsingEmbeddedDocumentExtractor;
    import org.apache.tika.io.TemporaryResources;
    import org.apache.tika.io.TikaInputStream;
    import org.apache.tika.metadata.Metadata;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 30.8K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/helper/LanguageHelper.java

    import java.util.Arrays;
    import java.util.Map;
    import java.util.stream.Collectors;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.apache.tika.language.detect.LanguageDetector;
    import org.apache.tika.language.detect.LanguageResult;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    import org.codelibs.fess.util.ComponentUtil;
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 6.9K bytes
    - Viewed (0)
  5. src/main/resources/fess_label_tr.properties

    labels.expires=Son Kullanma
    labels.failureCountThreshold=Hata Sayısı
    labels.fileConfigName=Dosya Tarama Yapılandırma Adı
    labels.fileName=Dosya Adı
    labels.handlerName=İşleyici Adı
    labels.handlerParameter=Parametre
    labels.handlerScript=Betik
    labels.popularWord=Popüler Kelime
    labels.ignoreFailureType=Yok Sayılan Hata Türü
    labels.lastAccessTime=Son Erişim Zamanı
    labels.notificationTo=Bildirim Alıcısı
    labels.num=Sayı
    labels.pn=Sayfa Numarası
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 47K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/x-texinfo",
    				"application/x-tika-msoffice",
    				"application/x-tika-msoffice-embedded",
    				"application/x-tika-msoffice-embedded;format=ole10_native",
    				"application/x-tika-msoffice-embedded;format=comp_obj",
    				"application/x-tika-msworks-spreadsheet",
    				"application/x-tika-ooxml",
    				"application/x-tika-ooxml-protected",
    				"application/x-tika-staroffice",
    				"application/x-uc2-compressed",
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 50.1K bytes
    - Viewed (0)
  7. pom.xml

    			<groupId>com.ibm.icu</groupId>
    			<artifactId>icu4j</artifactId>
    			<version>${icu4j.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.tika</groupId>
    			<artifactId>tika-langdetect-optimaize</artifactId>
    			<version>${tika.version}</version>
    			<exclusions>
    				<exclusion>
    					<groupId>javax.annotation</groupId>
    					<artifactId>javax.annotation-api</artifactId>
    				</exclusion>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 20 08:30:43 UTC 2025
    - 49.4K bytes
    - Viewed (0)
  8. CLAUDE.md

    - **Build**: Maven 3.x
    - **License**: Apache 2.0
    - **DI**: LastaFlute DI
    - **Repo**: https://github.com/codelibs/fess-crawler
    
    ### Tech Stack
    
    - **HTTP**: Apache HttpComponents 4.5+
    - **Extraction**: Apache Tika 3.0+, POI 5.3+, PDFBox 3.0+
    - **Testing**: JUnit 4, UTFlute, Mockito 5.7.0
    - **Storage**: In-memory (default), OpenSearch (optional)
    
    ### Protocols
    
    - **HTTP/HTTPS**: Full crawling, cookies, auth, robots.txt
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

        public Logger getLogger() {
            return logger;
        }
    
        /**
         * Gets the appropriate extractor for the given response data.
         * Selects an extractor based on the MIME type or falls back to the Tika extractor.
         *
         * @param responseData the response data containing the document to extract
         * @return the extractor instance for processing the document
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/job/CrawlJob.java

            } else {
                cmdList.add("-Dfess.log.level=" + logLevel);
                if ("debug".equalsIgnoreCase(logLevel)) {
                    cmdList.add("-Dorg.apache.tika.service.error.warn=true");
                }
            }
            stream(fessConfig.getJvmCrawlerOptionsAsArray())
                    .of(stream -> stream.filter(StringUtil::isNotBlank).forEach(value -> cmdList.add(value)));
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 19.6K bytes
    - Viewed (0)
Back to top