Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 14 for Wildcard (0.38 sec)

  1. src/main/java/org/codelibs/fess/query/WildcardQueryCommand.java

    import org.opensearch.index.query.QueryBuilder;
    import org.opensearch.index.query.QueryBuilders;
    
    /**
     * Query command for handling wildcard queries.
     * Converts Lucene WildcardQuery objects to OpenSearch QueryBuilder objects,
     * supporting wildcard pattern matching with configurable case sensitivity.
     */
    public class WildcardQueryCommand extends QueryCommand {
    
        /**
         * Default constructor.
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 5.7K bytes
    - Viewed (0)
  2. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_wildcard.txt

    # Test robots.txt for wildcard (*) and end-of-path ($) support
    # Based on RFC 9309 specification
    
    # Test wildcard patterns
    User-agent: WildcardBot
    Disallow: /*.pdf$
    Disallow: /admin/*.php
    Disallow: /*/private/
    Allow: /public/*.html
    
    # Test end-of-path ($) patterns
    User-agent: EndPathBot
    Disallow: /fish$
    Disallow: /temp$
    Allow: /fishing
    
    # Test complex patterns
    User-agent: ComplexBot
    Disallow: /
    Allow: /$
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 14:03:41 UTC 2025
    - 910 bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

     *   <li>Manages crawl delay settings per user agent</li>
     *   <li>Stores sitemap URLs listed in robots.txt</li>
     * </ul>
     *
     * <p>The class uses case-insensitive pattern matching for user agents and supports
     * wildcard characters (*) in user agent strings. When multiple directives match a user agent,
     * the most specific (longest) match is used.</p>
     *
     */
    public class RobotsTxt {
        private static final String ALL_BOTS = "*";
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 18.5K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/query/PrefixQueryCommand.java

            }
            return value;
        }
    
        /**
         * Sets the lowercase wildcard flag by storing the given value in the
         * {@code lowercaseWildcard} field of this instance.
         *
         * NOTE(review): how the flag is consumed is not visible in this excerpt;
         * presumably it controls whether query terms are lowercased before the
         * query is built - confirm against the rest of the class.
         *
         * @param lowercaseWildcard the new value of the lowercase wildcard flag
         */
        public void setLowercaseWildcard(final boolean lowercaseWildcard) {
            this.lowercaseWildcard = lowercaseWildcard;
        }
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/cors/CorsHandlerFactory.java

         */
        protected Map<String, CorsHandler> handerMap = new HashMap<>();
    
        /**
         * Adds a CORS handler for the specified origin.
         *
         * @param origin the origin pattern (can be "*" for wildcard)
         * @param handler the CORS handler to associate with the origin
         */
        public void add(final String origin, final CorsHandler handler) {
            if (logger.isDebugEnabled()) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 2.2K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

            try {
                robotsTxt = robotsTxtHelper.parse(in);
            } finally {
                CloseableUtil.closeQuietly(in);
            }
    
            // Test WildcardBot - wildcard patterns
            // Disallow: /*.pdf$ - should block .pdf files but not .pdf with query params
            assertFalse(robotsTxt.allows("/document.pdf", "WildcardBot"));
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 20.6K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    /**
     * Robots.txt Parser following RFC 9309 specification.
     *
     * <p>This implementation supports the following features:</p>
     * <ul>
     * <li>User-agent directive with wildcard (*) matching</li>
     * <li>Disallow and Allow directives with pattern matching</li>
     * <li>Wildcard (*) in paths - matches any sequence of characters</li>
     * <li>End-of-path ($) matching - matches the end of URL path</li>
     * <li>Crawl-delay directive</li>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 14 12:52:01 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/suggest/util/SuggestUtil.java

            }
        }
    
        /**
         * Escapes wildcard characters in the given query string.
         *
         * This method replaces all occurrences of '*' with '\*' and
         * all occurrences of '?' with '\?' to ensure that these characters
         * are treated as literals rather than wildcard characters in queries.
         *
         * @param query the query string to escape
    Registered: Sat Dec 20 13:04:59 UTC 2025
    - Last Modified: Sun Nov 23 11:21:40 UTC 2025
    - 17.5K bytes
    - Viewed (1)
  9. src/main/java/org/codelibs/fess/query/TermQueryCommand.java

            context.addFieldLog(field, text);
            context.addHighlightedQuery(text);
            return QueryBuilders.termQuery(field, text).boost(boost);
        }
    
        /**
         * Converts a term query to a wildcard query for URL field matching.
         *
         * @param fessConfig the Fess configuration
         * @param context the query context
         * @param termQuery the term query to convert
         * @param boost the boost value to apply
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 13.6K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/RobotsTxtTest.java

            assertNotNull(matched);
            assertEquals("MyBot", matched.getUserAgent());
        }
    
        public void test_getMatchedDirectiveWithWildcard() {
            // Test getMatchedDirective with wildcard
            RobotsTxt robotsTxt = new RobotsTxt();
    
            Directive directive = new Directive("*");
            directive.addDisallow("/private/");
            robotsTxt.addDirective(directive);
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 13:29:22 UTC 2025
    - 14.4K bytes
    - Viewed (0)
Back to top