Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 4 of 4 for AbstractXmlExtractor (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

     * It handles encoding detection, HTML entity unescaping, and tag-based content extraction.
     *
     */
    public abstract class AbstractXmlExtractor extends AbstractExtractor {
    
        /**
         * Logger for this class.
         */
        protected static final Logger logger = LogManager.getLogger(AbstractXmlExtractor.class);
    
        /**
         * UTF-7 Byte Order Mark definition.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.util.regex.Pattern;
    
    /**
     * Extracts text content from XML documents.
     */
    public class XmlExtractor extends AbstractXmlExtractor {
    
        /**
         * Creates a new XmlExtractor instance.
         */
        public XmlExtractor() {
            super();
        }
    
        /**
         * Pattern for XML encoding.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

         *
         * @see
         * org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getEncodingPattern()
         */
        @Override
        protected Pattern getEncodingPattern() {
            // Hand back the meta-charset pattern field as the encoding pattern.
            final Pattern encodingPattern = metaCharsetPattern;
            return encodingPattern;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getTagPattern()
         */
        @Override
        protected Pattern getTagPattern() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

         *
         * @see
         * org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getEncodingPattern()
         */
        @Override
        protected Pattern getEncodingPattern() {
            // The encoding pattern for this extractor is its meta-charset pattern field.
            final Pattern charsetPattern = metaCharsetPattern;
            return charsetPattern;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getTagPattern()
         */
        @Override
        protected Pattern getTagPattern() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
Back to top