Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 3 of 3 for AbstractXmlExtractor (0.1 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

     * It handles encoding detection, HTML entity unescaping, and tag-based content extraction.
     *
     */
    public abstract class AbstractXmlExtractor extends AbstractExtractor {
    
        /**
         * Logger for this class.
         */
        protected static final Logger logger = LogManager.getLogger(AbstractXmlExtractor.class);
    
        /**
         * UTF-7 Byte Order Mark definition.
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 8.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

         *
         * @see
         * org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getEncodingPattern()
         */
        @Override
        protected Pattern getEncodingPattern() {
            return metaCharsetPattern;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getTagPattern()
         */
        @Override
        protected Pattern getTagPattern() {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Oct 04 08:47:19 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

         *
         * @see
         * org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getEncodingPattern()
         */
        @Override
        protected Pattern getEncodingPattern() {
            return metaCharsetPattern;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getTagPattern()
         */
        @Override
        protected Pattern getTagPattern() {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Oct 04 08:47:19 UTC 2025
    - 10.4K bytes
    - Viewed (0)
Back to top