Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 44 for Extract (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java

    public class MsPublisherExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPublisherExtractor instance.
         */
        public MsPublisherExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Publisher input stream.
         * @param in The input stream.
         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.util.regex.Pattern;
    
    /**
     * Extracts text content from XML documents.
     */
    public class XmlExtractor extends AbstractXmlExtractor {
    
        /**
         * Creates a new XmlExtractor instance.
         */
        public XmlExtractor() {
            super();
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content from an input stream as plain text.
     */
    public class TextExtractor extends AbstractExtractor {
    
        /**
         * The encoding for text.
         */
        protected String encoding = Constants.UTF_8;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java

     */
    public class MsVisioExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsVisioExtractor instance.
         */
        public MsVisioExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Visio input stream.
         * @param in The input stream.
         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/BinaryTransformer.java

     * into a ResultData object, and for retrieving the binary data from an AccessResultData object.
     * It extends the AbstractTransformer class.
     *
     * <p>
     * This transformer extracts the binary content from the response body of a web resource,
     * stores it as a byte array in the ResultData, and provides a method to retrieve this data
     * as a ByteArrayInputStream.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

     *
     */
    public class MsWordExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsWordExtractor instance.
         */
        public MsWordExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Word input stream.
         * @param in The input stream.
         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java

     */
    public class MsExcelExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsExcelExtractor instance.
         */
        public MsExcelExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Excel input stream.
         * @param in The input stream.
         * @param params The parameters.
         * @return The extracted data.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java

            super(params);
        }
    
        /**
         * Delays before processing a URL, ensuring that requests to the same host are not made too frequently.
         * This method extracts the host from the URL and enforces a delay based on the configured
         * delayMillisBeforeProcessing parameter.
         *
         * @throws InterruptedRuntimeException if the thread is interrupted during the delay
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java

     * only one of them (allRequired = false). It also supports a default rule that always matches.
     *
     * <p>
     * The class uses a map of field names to Pattern objects to store the regular expressions.
     * The match method extracts the values of the specified fields from the ResponseData and
     * applies the corresponding regular expressions.
     * </p>
     *
     * <p>
     * Example usage:
     * </p>
     *
     * <pre>
     * {@code
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java

                } catch (final Exception e) {
                    throw new OpenSearchAccessException("response: " + response, e);
                }
            }
            return targetList;
        }
    
        /**
         * Extracts a field value from OpenSearch results and converts it to the specified type.
         *
         * @param <T> The target type.
         * @param field The field value from OpenSearch.
         * @param clazz The target class.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 10.9K bytes
    - Viewed (0)
Back to top