Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 4 of 4 for getTagPattern (0.12 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

         * This pattern is utilized by the extractor to identify and process XML elements.
         *
         * @return the {@link Pattern} instance for XML tag matching
         */
        @Override
        protected Pattern getTagPattern() {
            return xmlTagPattern;
        }
    
        /**
         * Returns the XML encoding pattern.
         * @return The XML encoding pattern.
         */
        public Pattern getXmlEncodingPattern() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

         */
        protected abstract Pattern getEncodingPattern();
    
        /**
         * Returns the pattern used to identify tags in the content.
         * Each concrete extractor supplies its own pattern through this hook.
         *
         * NOTE(review): at least one implementation (HtmlXpathExtractor) returns
         * {@code null} because it does not use the pattern - confirm that callers
         * in this class tolerate a {@code null} result.
         *
         * @return The tag pattern.
         */
        protected abstract Pattern getTagPattern();
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("The inputstream is null.");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

            return metaCharsetPattern;
        }
    
        /**
         * Returns the tag pattern for this extractor, which is the value held in
         * {@code htmlTagPattern}.
         *
         * @return the value of {@code htmlTagPattern}
         * @see org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getTagPattern()
         */
        @Override
        protected Pattern getTagPattern() {
            return htmlTagPattern;
        }
    
        /**
         * Gets the pattern used for extracting charset from meta tags.
         *
         * @return the meta charset pattern
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

            return metaCharsetPattern;
        }
    
        /**
         * Always returns {@code null}: this extractor does not use a tag pattern,
         * so the method exists only to satisfy the abstract declaration it overrides.
         *
         * @return {@code null}, unconditionally
         * @see org.codelibs.fess.crawler.extractor.impl.AbstractXmlExtractor#getTagPattern()
         */
        @Override
        protected Pattern getTagPattern() {
            // not used
            return null;
        }
    
        /**
         * Adds a feature to the extractor.
         *
         * @param key   the key of the feature
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
Back to top