Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 265 for patterns (1.14 sec)

  1. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

        }
    
        /**
         * Gets the list of include URL patterns for the specified session.
         *
         * @param sessionId The session ID.
         * @return The list of compiled include patterns.
         * @throws CrawlerSystemException if the patterns cannot be loaded.
         */
        @Override
        public List<Pattern> getIncludeUrlPatternList(final String sessionId) {
            try {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:40:57 UTC 2025
    - 9K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            String sessionId = "test-session-024";
            urlFilter.init(sessionId);
    
            // Test empty pattern
            urlFilter.addInclude("");
            urlFilter.addExclude("");
    
            // Test single character pattern
            urlFilter.addInclude(".");
            urlFilter.addExclude("*");
    
            // Test patterns with only special characters
            urlFilter.addInclude("^$");
            urlFilter.addExclude(".*");
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterServiceTest.java

                    .getTotalHits()
                    .value() > 0);
    
            // Verify pattern can be retrieved
            final List<Pattern> patterns = urlFilterService.getIncludeUrlPatternList(sessionId);
            assertEquals(1, patterns.size());
            assertTrue(patterns.get(0).matcher("http://example.com/page1").matches());
            assertFalse(patterns.get(0).matcher("http://other.com/page1").matches());
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  4. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_wildcard.txt

    # Based on RFC 9309 specification
    
    # Test wildcard patterns
    User-agent: WildcardBot
    Disallow: /*.pdf$
    Disallow: /admin/*.php
    Disallow: /*/private/
    Allow: /public/*.html
    
    # Test end-of-path ($) patterns
    User-agent: EndPathBot
    Disallow: /fish$
    Disallow: /temp$
    Allow: /fishing
    
    # Test complex patterns
    User-agent: ComplexBot
    Disallow: /
    Allow: /$
    Allow: /index.html$
    Allow: /public/
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 14:03:41 UTC 2025
    - 910 bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

    /**
     * A factory class for managing and creating crawler clients based on URL patterns.
     * This class implements AutoCloseable to properly handle resource cleanup.
     *
     * <p>The factory maintains a map of regular expression patterns to crawler clients,
     * allowing for URL-based client selection. Clients can be added with specific patterns
     * and optionally at specific positions in the processing order.</p>
     *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

            private final int priorityLength;
    
            /**
             * Constructs a new PathPattern from the given robots.txt path pattern.
             * @param pattern the path pattern string from robots.txt (may contain * and $)
             */
            public PathPattern(final String pattern) {
                this.pattern = pattern;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 18.5K bytes
    - Viewed (0)
  7. cmd/endpoint-ellipses.go

    					symmetry = uint64(len(p.Seq))%ss == 0
    				} else {
    					symmetry = ss%uint64(len(p.Seq)) == 0
    				}
    			}
    		}
    		// With no arg patterns, it is expected that user knows
    		// the right symmetry, so either ellipses patterns are
    		// provided (recommended) or no ellipses patterns.
    		if _, ok := newSetCounts[ss]; !ok && (symmetry || argPatterns == nil) {
    			newSetCounts[ss] = struct{}{}
    		}
    	}
    
    	setCounts = []uint64{}
    Registered: Sun Dec 28 19:28:13 UTC 2025
    - Last Modified: Sun Sep 28 20:59:21 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/util/GsaConfigParser.java

        }
    
        /**
         * Converts a GSA URL pattern into a regular expression pattern suitable for Fess.
         * Handles various GSA pattern formats including regexp, contains, and URL-based patterns.
         *
         * @param s the input GSA pattern string
         * @return a regular expression pattern string, or empty string for comments/invalid patterns
         */
        protected String getFilterPath(final String s) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 21.6K bytes
    - Viewed (0)
  9. compat/maven-compat/src/test/java/org/apache/maven/artifact/resolver/filter/FilterHashEqualsTest.java

    /**
     */
    class FilterHashEqualsTest {
    
        @Test
        void testIncludesExcludesArtifactFilter() {
            List<String> patterns = Arrays.asList("c", "d", "e");
    
            IncludesArtifactFilter f1 = new IncludesArtifactFilter(patterns);
    
            IncludesArtifactFilter f2 = new IncludesArtifactFilter(patterns);
    
            assertTrue(f1.equals(f2), "Expected " + f1 + " to equal " + f2);
    Registered: Sun Dec 28 03:35:09 UTC 2025
    - Last Modified: Wed Sep 17 10:01:14 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  10. CLAUDE.md

    **Flow**: Poll URL → Validate → Get client → Delay → Check last-modified → Execute → Process → Extract children → Queue children → Delay
    
    ### CrawlerClientFactory
    
    Pattern-based client selection using `LinkedHashMap<Pattern, CrawlerClient>`.
    
    **Standard Patterns**:
    ```java
    "^https?://.*"     → httpClient
    "^file:.*"         → fileSystemClient
    "^ftp://.*"        → ftpClient
    "^smb://.*"        → smbClient
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
Back to top