Search Options

Results per page
Sort
Preferred Languages
Advance

Results 71 - 80 of 104 for extraction (0.07 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractorTest.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.ResourceUtil;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractorTest.java

            final BufferedInputStream bis = new BufferedInputStream(in);
            final String encoding = htmlExtractor.getEncoding(bis);
            CloseableUtil.closeQuietly(bis);
            assertEquals("UTF-8", encoding);
        }
    
        public void test_getEncoding_sjis() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/test_sjis.html");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TarExtractorTest.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    
    import org.apache.commons.compress.archivers.ArchiveStreamFactory;
    import org.apache.commons.compress.compressors.CompressorStreamFactory;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 3.7K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
        <include path="crawler/sitemaps.xml"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/suggest/index/contents/document/DocumentReader.java

     */
    package org.codelibs.fess.suggest.index.contents.document;
    
    import java.io.Closeable;
    import java.util.Map;
    
    /**
     * Interface for reading documents and extracting their contents into a map.
     * Implementations of this interface should provide the logic for reading
     * documents and converting them into a key-value structure.
     *
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 1.4K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractorTest.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.Map;
    
    import org.apache.poi.hpbf.extractor.PublisherTextExtractor;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  8. src/main/java/jcifs/internal/dfs/DfsReferralResponseBuffer.java

    import java.util.Arrays;
    
    import jcifs.Decodable;
    import jcifs.internal.util.SMBUtil;
    
    /**
     * DFS (Distributed File System) referral response buffer parser.
     * Decodes server responses to DFS referral requests, extracting information about
     * available DFS targets, path consumption details, and referral flags.
     *
     * @author mbechler
     */
    public class DfsReferralResponseBuffer implements Decodable {
    
        /**
    Registered: Sun Sep 07 00:10:21 UTC 2025
    - Last Modified: Sat Aug 16 01:32:48 UTC 2025
    - 3.2K bytes
    - Viewed (0)
  9. .github/workflows/create_issue.js

      if (pr_match_groups.length != 2) {
        console.log(`PR Number not found in ${context.payload.head_commit.message}`);
        throw "Error extracting PR Number from commit message";
      }
      const pr_number = parseInt(pr_match_groups[1]);
      const owner = context.payload.repository.owner.name;
      const repo = context.payload.repository.name;
    Registered: Tue Sep 09 12:39:10 UTC 2025
    - Last Modified: Mon Oct 18 23:04:59 UTC 2021
    - 2.8K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.util.regex.Pattern;
    
    /**
     * Extracts text content from XML documents.
     */
    public class XmlExtractor extends AbstractXmlExtractor {
    
        /**
         * Creates a new XmlExtractor instance.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
Back to top