Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 22 for pomFile (0.14 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

        /** Pattern for extracting charset from meta tags. */
        protected Pattern metaCharsetPattern = Pattern.compile("<meta.*content\\s*=\\s*['\"].*;\\s*charset=([\\w\\d\\-_]*)['\"]\\s*/?>",
                Pattern.MULTILINE | Pattern.CASE_INSENSITIVE);
    
        /**
         * Pattern for HTML tags.
         */
        protected Pattern htmlTagPattern = Pattern.compile("<[^>]+>");
    
        /** Map of parser features. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

                            return getList(OpenSearchUrlFilter.class, key, QueryBuilders.termQuery(FILTER_TYPE, type), null, maxLoadSize, null)
                                    .stream()
                                    .map(f -> Pattern.compile(f.getUrl()))
                                    .collect(Collectors.toList());
                        }
                    });
        }
    
        /**
         * Adds an include URL filter for the specified session.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java

         * @param key the field name to match against
         * @param regex the regular expression pattern
         */
        public void addRule(final String key, final String regex) {
            regexMap.put(key, Pattern.compile(regex));
        }
    
        /**
         * Adds a compiled regular expression rule for the specified field.
         * @param key the field name to match against
         * @param pattern the compiled regular expression pattern
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

            }
            final Matcher matcher = getTagPattern().matcher(input);
            final StringBuffer sb = new StringBuffer();
            final Pattern attrPattern = Pattern.compile("\\s[^ ]+=\"([^\"]*)\"");
            while (matcher.find()) {
                final String tagStr = matcher.group();
                final Matcher attrMatcher = attrPattern.matcher(tagStr);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

         *
         * @param directive The directive to add to the robots.txt rules
         */
        public void addDirective(final Directive directive) {
            directiveMap.put(Pattern.compile(directive.getUserAgent().replace("*", ".*"), Pattern.CASE_INSENSITIVE), directive);
        }
    
        /**
         * Adds a sitemap URL to the list of sitemaps.
         *
         * @param url The URL of the sitemap to be added
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

         * If you want to follow a html spec, use 512. */
        protected int preloadSizeForCharset = 2048;
    
        /**
         * Pattern for invalid URLs.
         */
        protected Pattern invalidUrlPattern = Pattern.compile("^\\s*javascript:|" //
                + "^\\s*mailto:|" //
                + "^\\s*irc:|" //
                + "^\\s*skype:|" //
                + "^\\s*about:|" + "^\\s*fscommand:|" //
                + "^\\s*aim:|" //
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

         * Example: &lt;meta http-equiv="Content-Type" content="text/html; charset=UTF-8"&gt;
         */
        protected Pattern metaCharsetPattern = Pattern.compile("<meta.*content\\s*=\\s*['\"].*;\\s*charset=([\\w\\d\\-_]*)['\"]\\s*/?>",
                Pattern.MULTILINE | Pattern.CASE_INSENSITIVE);
    
        /**
         * Map of features for the DOM parser.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java

         * @param content The content to search.
         * @return The extracted token value.
         */
        protected String getTokenValue(final String tokenPattern, final String content) {
            final Matcher matcher = Pattern.compile(tokenPattern).matcher(content);
            if (matcher.find()) {
                if (logger.isDebugEnabled()) {
                    logger.debug("Matched: {}", matcher.group());
                }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (1)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

         */
        public XpathTransformer() {
            super();
        }
    
        private static final Logger logger = LogManager.getLogger(XpathTransformer.class);
    
        private static final Pattern SPACE_PATTERN = Pattern.compile("\\s+", Pattern.MULTILINE);
    
        /**
         * A map of field rules, where the key is the field name and the value is the XPath expression.
         */
        protected Map<String, String> fieldRuleMap = new LinkedHashMap<>();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java

     * </pre>
     */
    public class XmlTransformer extends AbstractTransformer {
        private static final Logger logger = LogManager.getLogger(XmlTransformer.class);
    
        private static final Pattern SPACE_PATTERN = Pattern.compile("\\s+", Pattern.MULTILINE);
    
        /**
         * If true, the parser will be namespace aware.
         */
        protected boolean namespaceAware;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 23.9K bytes
    - Viewed (0)
Back to top