- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 60 for Extractor (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java
import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.exception.MaxLengthExceededException; import org.codelibs.fess.crawler.extractor.Extractor; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.MimeTypeHelper; import org.codelibs.fess.crawler.util.IgnoreCloseInputStream; import org.slf4j.Logger; import org.slf4j.LoggerFactory;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 4.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java
dfos = out; CopyUtil.copy(in, out); out.flush(); Extractor extractor = StringUtil.isBlank(mimeType) ? null : extractorFactory.getExtractor(mimeType); if (extractor == null) { final String detectedMimeType = getMimeType(out); extractor = extractorFactory.getExtractor(detectedMimeType);
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:40:57 UTC 2024 - 6.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractorTest.java
final InputStream in = ResourceUtil.getResourceAsStream("extractor/test_sjis.xml"); final String content = xmlExtractor.getText(in, null).getContent(); CloseableUtil.closeQuietly(in); logger.info(content); assertTrue(content.contains("テスト")); } public void test_getXml_entity() { final InputStream in = ResourceUtil.getResourceAsStream("extractor/test_entity.xml");
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 6.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import java.util.Map; import org.apache.poi.hslf.usermodel.HSLFShape; import org.apache.poi.hslf.usermodel.HSLFSlideShow; import org.apache.poi.hslf.usermodel.HSLFTextParagraph; import org.apache.poi.sl.extractor.SlideShowExtractor; import org.codelibs.fess.crawler.entity.ExtractData;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java
// InputStream in = // ResourceUtil.getResourceAsStream("extractor/test_pass.pdf"); // TikaExtractor extractor = // (TikaExtractor) getContainer().getComponent( // "tikaExtractorForPdfPassword"); // Map<String, String> params = new HashMap<String, String>(); // params.put(ExtractData.URL, "http://example.com/test_pass.pdf"); // ExtractData extractData = extractor.getText(in, params);
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 30.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java
import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.extractor.Extractor; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.MimeTypeHelper; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import jakarta.mail.Address; import jakarta.mail.BodyPart;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 10.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java
/** * Gets a text from .doc file. * * @author shinsuke * */ public class MsWordExtractor extends AbstractExtractor { /* * (non-Javadoc) * * @see org.codelibs.fess.crawler.extractor.Extractor#getText(java.io.InputStream, * java.util.Map) */ @Override public ExtractData getText(final InputStream in, final Map<String, String> params) { if (in == null) {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java
* * @author shinsuke * */ public class MsExcelExtractor extends AbstractExtractor { /* * (non-Javadoc) * * @see * org.codelibs.fess.crawler.extractor.impl.Extractor#getText(java.io.InputStream, * java.util.Map) */ @Override public ExtractData getText(final InputStream in, final Map<String, String> params) { if (in == null) {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractorTest.java
private TestApiExtractorServer server; private ApiExtractor extractor; @Override protected void setUp() throws Exception { super.setUp(); server = new TestApiExtractorServer(port); server.start(); extractor = new ApiExtractor(); extractor.setUrl("http://127.0.0.1:" + port + "/"); extractor.init(); } @Override
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 5.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java
import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.CrawlingAccessException; import org.codelibs.fess.crawler.extractor.Extractor; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import jakarta.annotation.Resource; /** * @author shinsuke * */
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 5.2K bytes - Viewed (0)