Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 141 for Patterns (5.21 sec)

  1. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_wildcard.txt

    # Based on RFC 9309 specification
    
    # Test wildcard patterns
    User-agent: WildcardBot
    Disallow: /*.pdf$
    Disallow: /admin/*.php
    Disallow: /*/private/
    Allow: /public/*.html
    
    # Test end-of-path ($) patterns
    User-agent: EndPathBot
    Disallow: /fish$
    Disallow: /temp$
    Allow: /fishing
    
    # Test complex patterns
    User-agent: ComplexBot
    Disallow: /
    Allow: /$
    Allow: /index.html$
    Allow: /public/
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 14:03:41 UTC 2025
    - 910 bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

    /**
     * A factory class for managing and creating crawler clients based on URL patterns.
     * This class implements AutoCloseable to properly handle resource cleanup.
     *
     * <p>The factory maintains a map of regular expression patterns to crawler clients,
     * allowing for URL-based client selection. Clients can be added with specific patterns
     * and optionally at specific positions in the processing order.</p>
     *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlFilterService.java

        /**
         * Retrieves a list of URL patterns to include for a given session.
         *
         * @param sessionId the ID of the session for which to retrieve the include URL patterns
         * @return a list of compiled regular expression patterns representing the URLs to include
         */
        List<Pattern> getIncludeUrlPatternList(String sessionId);
    
        /**
         * Retrieves a list of URL patterns to be excluded for a given session.
         *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

        }
    
        /**
         * Gets the list of include URL patterns for the specified session.
         *
         * @param sessionId The session ID.
         * @return The list of compiled include patterns.
         * @throws CrawlerSystemException if the patterns cannot be loaded.
         */
        @Override
        public List<Pattern> getIncludeUrlPatternList(final String sessionId) {
            try {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:40:57 UTC 2025
    - 9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/MemoryDataHelper.java

        /** Map of session IDs to include URL patterns for filtering URLs. */
        protected volatile Map<String, List<Pattern>> includeUrlPatternMap = new HashMap<>();
    
        /** Map of session IDs to exclude URL patterns for filtering URLs. */
        protected volatile Map<String, List<Pattern>> excludeUrlPatternMap = new HashMap<>();
    
        /**
         * Creates a new MemoryDataHelper instance.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.1K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java

         * @param regex the regular expression pattern
         */
        public void addRule(final String key, final String regex) {
            regexMap.put(key, Pattern.compile(regex));
        }
    
        /**
         * Adds a compiled regular expression rule for the specified field.
         * @param key the field name to match against
         * @param pattern the compiled regular expression pattern
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java

         * (java.lang.String)
         */
        /**
         * Retrieves a list of URL patterns to be excluded for a given session.
         * @param sessionId The ID of the session.
         * @return A list of compiled regular expression patterns.
         */
        @Override
        public List<Pattern> getExcludeUrlPatternList(final String sessionId) {
            return dataHelper.getExcludeUrlPatternList(sessionId);
        }
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/app/web/admin/webconfig/CreateForm.java

        public String urls;
    
        /**
         * URL patterns to include during crawling.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String includedUrls;
    
        /**
         * URL patterns to exclude during crawling.
         */
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String excludedUrls;
    
        /**
         * Document URL patterns to include in search index.
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/core/io/SerializeUtil.java

         * <p>
         * Patterns can be exact class names or use wildcards with '*' at the end.
         * For example: "com.example.*" allows all classes in the com.example package.
         * </p>
         *
         * @param allowedPatterns the patterns of classes to allow
         * @return an ObjectInputFilter configured with the specified patterns
         */
    Registered: Sat Dec 20 08:55:33 UTC 2025
    - Last Modified: Sat Nov 22 11:21:59 UTC 2025
    - 9K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

            final List<Pattern> includeList = getUrlFilterService().getIncludeUrlPatternList(sessionId);
            final List<Pattern> excludeList = getUrlFilterService().getExcludeUrlPatternList(sessionId);
    
            if (!includeList.isEmpty()) {
                boolean match = false;
                for (final Pattern pattern : includeList) {
                    final Matcher matcher = pattern.matcher(url);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
Back to top