Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 66 for example (0.03 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            urlFilter.addInclude("https?://[^/]+\\.example\\.com/.*");
    
            assertTrue(urlFilter.match("http://www.example.com/"));
            assertTrue(urlFilter.match("https://api.example.com/v1/users"));
            assertTrue(urlFilter.match("http://subdomain.example.com/page"));
            assertFalse(urlFilter.match("https://example.org/"));
            assertFalse(urlFilter.match("ftp://files.example.com/"));
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  2. fess-crawler/src/test/resources/extractor/test.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <address xmlns:hoge="http://www.example.com/hoge">
    	<item sex="male" custid="A12345">
    		<name>鈴木太郎</name>
    		<access kind="email"></access>
    		<access kind="url">http://www.taro.com/</access>
    		<image file="taro.png" />
    	</item>
    	<item sex="male" custid="B23456">
    		<name>佐藤二朗</name>
    		<access kind="email">******@****.***</access>
    		<image file="jiro.png" />
    	</item>
    	<item sex="female" custid="C34567">
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 582 bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/AbstractRuleTest.java

            // Set patterns
            conditionalRule.setUrlPattern("https?://.*\\.example\\.com/.*");
            conditionalRule.setMimeTypePattern("text/.*");
    
            // Test matching
            ResponseData responseData1 = new ResponseData();
            responseData1.setUrl("http://www.example.com/page");
            responseData1.setMimeType("text/html");
            assertTrue(conditionalRule.match(responseData1));
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 21.9K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

            assertEquals("http://example.com:8080/path/file", HcHttpClient.constructRedirectLocation("http://example.com:8080/path/", "file"));
            assertEquals("http://example.com/%E3%83%86%E3%82%B9%E3%83%88",
                    HcHttpClient.constructRedirectLocation("http://example.com/", "テスト"));
            assertEquals("http://example.com/hello%20world", HcHttpClient.constructRedirectLocation("http://example.com/", "hello world"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XPathAPI.java

     *
     * <p>Example usage:</p>
     * <pre>
     * {@code
     * XPathAPI xPathAPI = new XPathAPI();
     * NodeList nodes = xPathAPI.selectNodeList(contextNode, "//example");
     * Node singleNode = xPathAPI.selectSingleNode(contextNode, "//example[1]");
     * XPathEvaluationResult<?> result = xPathAPI.eval(contextNode, "count(//example)");
     * }
     * </pre>
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  6. fess-crawler/src/test/resources/sitemaps/sitemap1.xml

       <url>
          <loc>http://www.example.com/</loc>
          <lastmod>2005-01-01</lastmod>
          <changefreq>monthly</changefreq>
          <priority>0.8</priority>
       </url>
       <url>
          <loc>http://www.example.com/catalog?item=12&amp;desc=vacation_hawaii</loc>
          <changefreq>weekly</changefreq>
       </url>
       <url>
          <loc>http://www.example.com/catalog?item=73&amp;desc=vacation_new_zealand</loc>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 915 bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/FileTransformerTest.java

            url = "http://www.example.com/";
            assertEquals("http_CLN_/www.example.com/index.html", fileTransformer.getFilePath(url));
    
            url = "http://www.example.com/action?a=1";
            assertEquals("http_CLN_/www.example.com/action_QUEST_a=1", fileTransformer.getFilePath(url));
    
            url = "http://www.example.com/action?a=1&b=2";
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 7.6K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImplTest.java

        }
    
        public void test_match_both() {
            urlFilter.addInclude("http://example.com/.*");
            urlFilter.addExclude("http://example.com/a.*");
    
            final String sessionId = "id1";
            urlFilter.init(sessionId);
    
            assertTrue(urlFilter.match("http://example.com/"));
            assertFalse(urlFilter.match("http://example.com/a"));
            assertFalse(urlFilter.match("http://test.com/"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.9K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

            String[] sitemaps = robotsTxt.getSitemaps();
            assertEquals(2, sitemaps.length);
            assertEquals("http://www.example.com/sitmap.xml", sitemaps[0]);
            assertEquals("http://www.example.net/sitmap.xml", sitemaps[1]);
    
        }
    
        public void testParse_disable() {
            final InputStream in = RobotsTxtHelperTest.class.getResourceAsStream("robots.txt");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  10. README.md

            Crawler crawler = container.getComponent("crawler");
            
            // Configure crawling parameters
            crawler.addUrl("https://example.com");
            crawler.crawlerContext.setMaxAccessCount(100);
            crawler.crawlerContext.setNumOfThread(5);
            crawler.urlFilter.addInclude("https://example.com/.*");
            
            // Execute crawling
            String sessionId = crawler.execute();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
Back to top