Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 31 for Disallow (0.04 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

            assertFalse(robotsTxt.allows("/store/public/sale", "PriorityBot")); // Most specific disallow
            assertFalse(robotsTxt.allows("/store/public/sale/item", "PriorityBot"));
    
            // Test SameLengthBot - Allow wins when same length as Disallow
            // Disallow: /page, Allow: /page
            assertTrue(robotsTxt.allows("/page", "SameLengthBot")); // Allow takes precedence
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 20.6K bytes
    - Viewed (0)
  2. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_wildcard.txt

    User-agent: PriorityBot
    Disallow: /store
    Allow: /store/public
    Disallow: /store/public/sale
    
    # Test Allow vs Disallow with same length (Allow wins)
    User-agent: SameLengthBot
    Disallow: /page
    Allow: /page
    
    # Test multiple wildcards
    User-agent: MultiWildcardBot
    Disallow: /*.cgi*
    Disallow: /*?*id=*
    
    # Test literal $ in middle of pattern
    User-agent: DollarBot
    Disallow: /price$info
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 14:03:41 UTC 2025
    - 910 bytes
    - Viewed (0)
  3. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_malformed.txt

    Disallow: /test/
    
    # Case 9: Special characters in paths
    User-agent: SpecialCharBot
    Disallow: /path with spaces/
    Disallow: /path%20encoded/
    Disallow: /path?query=value
    Disallow: /path#fragment
    Allow: /unicode/日本語/
    
    # Case 10: Multiple User-agents in sequence
    User-agent: Bot1
    User-agent: Bot2
    User-agent: Bot3
    Disallow: /shared/
    
    # Case 11: Sitemap with various formats
    Sitemap: http://example.com/sitemap.xml
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 14 12:52:01 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

     *
     * <p>Key features:</p>
     * <ul>
     *   <li>Supports multiple user-agent directives with pattern matching</li>
     *   <li>Handles Allow and Disallow rules for path-based access control</li>
     *   <li>Manages crawl delay settings per user agent</li>
     *   <li>Stores sitemap URLs listed in robots.txt</li>
     * </ul>
     *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 18.5K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                tempDir.mkdirs();
    
                final StringBuilder buf = new StringBuilder();
                buf.append("User-agent: *").append('\n');
                buf.append("Disallow: /admin/").append('\n');
                buf.append("Disallow: /websvn/").append('\n');
                final File robotTxtFile = new File(tempDir, "robots.txt");
                FileUtil.writeBytes(robotTxtFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

     * <li>Disallow and Allow directives with pattern matching</li>
     * <li>Wildcard (*) in paths - matches any sequence of characters</li>
     * <li>End-of-path ($) matching - matches the end of URL path</li>
     * <li>Crawl-delay directive</li>
     * <li>Sitemap directive</li>
     * <li>Comment support (#)</li>
     * <li>Priority-based matching (longest match wins, Allow beats Disallow at equal length)</li>
     * </ul>
     *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 14 12:52:01 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  7. regression-test/src/androidTest/java/okhttp/regression/compare/AndroidHttpEngineTest.kt

        try {
          val response = completableFuture.get(10, TimeUnit.SECONDS)
    
          assertEquals(200, response.code)
          assertEquals("h3", response.negotiatedProtocol)
          assertTrue(response.content.contains("Disallow"))
        } catch (ee: ExecutionException) {
          throw ee.cause?.cause ?: ee.cause!!
        }
      }
    
      data class Response(
        val code: Int,
        val negotiatedProtocol: String,
        val content: String,
    Registered: Fri Dec 26 11:42:13 UTC 2025
    - Last Modified: Wed Mar 19 19:25:20 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                tempDir.mkdirs();
    
                // robots.txt
                StringBuilder buf = new StringBuilder();
                buf.append("User-agent: *").append('\n');
                buf.append("Disallow: /admin/").append('\n');
                buf.append("Disallow: /websvn/").append('\n');
                final File robotTxtFile = new File(tempDir, "robots.txt");
                FileUtil.writeBytes(robotTxtFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/RobotsTxtTest.java

            directive.addDisallow("/admin/");
            directive.addDisallow("/private/");
    
            String[] disallows = directive.getDisallows();
            assertEquals(2, disallows.length);
            assertEquals("/admin/", disallows[0]);
            assertEquals("/private/", disallows[1]);
        }
    
        public void test_directiveAddDisallowNoDuplicates() {
            // Test that addDisallow doesn't add duplicates
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 13:29:22 UTC 2025
    - 14.4K bytes
    - Viewed (0)
  10. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                tempDir.mkdirs();
    
                // robots.txt
                StringBuilder buf = new StringBuilder();
                buf.append("User-agent: *").append('\n');
                buf.append("Disallow: /admin/").append('\n');
                buf.append("Disallow: /websvn/").append('\n');
                final File robotTxtFile = new File(tempDir, "robots.txt");
                FileUtil.writeBytes(robotTxtFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
Back to top