Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 65 for extraction (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

            } catch (final Exception e) {
                throw new ExtractException(e);
            }
        }
    
        /**
         * Returns the encoding used for text extraction.
         * @return the encoding
         */
        public String getEncoding() {
            return encoding;
        }
    
        /**
         * Sets the encoding.
         * @param encoding The encoding to set.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.File;
    import java.io.IOException;
    import java.util.List;
    
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

            this.propertyMap = propertyMap;
        }
    
        /**
         * Gets the map of child URL extraction rules.
         *
         * @return the child URL rule map
         */
        public Map<String, String> getChildUrlRuleMap() {
            return childUrlRuleMap;
        }
    
        /**
         * Sets the map of child URL extraction rules.
         *
         * @param childUrlRuleMap the child URL rule map to set
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

            return htmlTagPattern;
        }
    
        /**
         * Gets the pattern used for extracting charset from meta tags.
         *
         * @return the meta charset pattern
         */
        public Pattern getMetaCharsetPattern() {
            return metaCharsetPattern;
        }
    
        /**
         * Sets the pattern used for extracting charset from meta tags.
         *
         * @param metaCharsetPattern the meta charset pattern to set
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

            this.propertyMap = propertyMap;
        }
    
        /**
         * Gets the pattern for extracting charset from meta tags.
         *
         * @return the meta charset pattern
         */
        public Pattern getMetaCharsetPattern() {
            return metaCharsetPattern;
        }
    
        /**
         * Sets the pattern for extracting charset from meta tags.
         *
         * @param metaCharsetPattern the meta charset pattern to set
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

         *
         * @param in the input stream to extract text from
         * @param params additional parameters
         * @return the extracted data
         * @throws ExtractException if extraction fails
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (logger.isDebugEnabled()) {
                logger.debug("Accessing {}", url);
            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.2K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.helper.MimeTypeHelper;
    
    import jakarta.mail.Address;
    import jakarta.mail.BodyPart;
    import jakarta.mail.Header;
    import jakarta.mail.Message;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbClient.java

     * to interact with SMB resources.
     *
     * <p>
     * This client supports authentication, content retrieval, and metadata extraction from SMB files.
     * It handles file access, directory listing, and access control entries (ACEs) processing.
     * </p>
     *
     * <p>
     * The class provides methods to:
     * </p>
     * <ul>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 23K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb/SmbClient.java

     * to interact with SMB resources.
     *
     * <p>
     * This client supports authentication, content retrieval, and metadata extraction from SMB files.
     * It handles file access, directory listing, and access control entries (ACEs) processing.
     * </p>
     *
     * <p>
     * The class provides methods to:
     * </p>
     * <ul>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 22.5K bytes
    - Viewed (3)
  10. src/main/java/org/codelibs/fess/suggest/util/SuggestUtil.java

            return id;
        }
    
        /**
         * Parses the given query string and returns an array of keywords.
         *
         * @param q the query string to be parsed
         * @param field the field to be used for keyword extraction
         * @return an array of keywords extracted from the query string, or an empty array if the number of keywords exceeds the maximum allowed or if any keyword exceeds the maximum length
         */
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 17.4K bytes
    - Viewed (0)
Back to top