Search Options

Results per page
Sort
Preferred Languages
Advance

Results 21 - 28 of 28 for extractPath (0.14 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

                return createExtractData(content);
            } catch (final Exception e) {
                throw new ExtractException(e);
            }
        }
    
        protected ExtractData createExtractData(final String content) {
            return new ExtractData(extractString(content));
        }
    
        protected String getEncoding(final BufferedInputStream bis) {
            final byte[] b = new byte[preloadSizeForCharset];
            try {
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 6.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java

     */
    package org.codelibs.fess.crawler.extractor;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ExtractData;
    
    /**
     * @author shinsuke
     *
     */
    public interface Extractor {
    
        ExtractData getText(InputStream in, Map<String, String> params);
    
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 905 bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractorTest.java

            final String content = ATTR_NAME + "," + testStr;
            final Map<String, String> params = new HashMap<String, String>();
            //final ExtractData text = extractor.getText(new ByteArrayInputStream(FileUtils.readFileToByteArray(new File(filePath))), params);
            final ExtractData text = extractor.getText(new ByteArrayInputStream(testStr.getBytes()), params);
            assertEquals(content, text.getContent());
        }
    
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 5.4K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractorTest.java

    import java.io.InputStream;
    
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.dbflute.utflute.core.PlainTestCase;
    import org.slf4j.Logger;
    import org.slf4j.LoggerFactory;
    
    /**
     * @author shinsuke
     *
     */
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 3.7K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/ExtractorFactoryTest.java

    import java.io.InputStream;
    import java.util.ArrayList;
    import java.util.List;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.extractor.impl.LhaExtractor;
    import org.codelibs.fess.crawler.extractor.impl.PasswordBasedExtractor;
    import org.codelibs.fess.crawler.extractor.impl.PdfExtractor;
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 5.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

            }
            final Extractor extractor = extractorFactory.getExtractor(responseData.getMimeType());
            final Map<String, String> params = new HashMap<>();
            params.put(ExtractData.RESOURCE_NAME_KEY, getResourceName(responseData));
            params.put(ExtractData.CONTENT_TYPE, responseData.getMimeType());
            String content = null;
            try (final InputStream in = responseData.getResponseBody()) {
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 5.2K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

    import org.codelibs.core.io.CopyUtil;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.exception.MaxLengthExceededException;
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Mar 14 13:56:25 UTC 2024
    - 6.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

    import java.util.regex.Pattern;
    
    import javax.annotation.Resource;
    import javax.xml.xpath.XPathNodes;
    
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.util.XPathAPI;
    import org.codelibs.nekohtml.parsers.DOMParser;
    Registered: Wed Jun 12 15:17:51 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 7K bytes
    - Viewed (0)
Back to top