Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 7 of 7 for RegexRule (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java

     * applies the corresponding regular expressions.
     * </p>
     *
     * <p>
     * Example usage:
     * </p>
     *
     * <pre>
     * {@code
     * RegexRule rule = new RegexRule();
     * rule.addRule("url", "https://example.com/.*");
     * rule.addRule("contentType", "text/html");
     * rule.setAllRequired(true); // Both URL and content type must match
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/RegexRuleTest.java

            assertTrue(regexRule.match(getTestData4()));
        }
    
        public void test_match_url() {
            final RegexRule regexRule = new RegexRule();
            regexRule.defaultRule = false;
            regexRule.allRequired = true;
            regexRule.addRule("url", Pattern.compile("http:.*"));
    
            assertTrue(regexRule.match(getTestData1()));
            assertFalse(regexRule.match(getTestData2()));
            assertTrue(regexRule.match(getTestData3()));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.8K bytes
    - Viewed (0)
  3. src/main/resources/crawler/rule.xml

    			<arg>fsFileRule</arg>
    		</postConstruct>
    		<postConstruct name="addRule">
    			<arg>defaultRule</arg>
    		</postConstruct>
    	</component>
    
    	<component name="sitemapsRule" class="org.codelibs.fess.crawler.rule.impl.RegexRule" >
    		<property name="ruleId">"sitemapsRule"</property>
    		<property name="responseProcessor">
    			<component class="org.codelibs.fess.crawler.processor.impl.SitemapsResponseProcessor">
    			</component>
    		</property>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jun 04 08:42:49 UTC 2020
    - 4.6K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImplTest.java

            assertNotNull(rule);
            assertEquals("fileRule", rule.getRuleId());
    
            final RegexRule rule2 = new RegexRule();
            rule2.setAllRequired(true);
            rule2.addRule("url", "http:.*");
    
            final RegexRule rule3 = new RegexRule();
            rule3.addRule("url", "http:.*");
    
            assertFalse(ruleManager.hasRule(rule2));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.helper.SitemapsHelper;
    
    /**
     * SitemapsRule is a rule implementation that extends RegexRule to determine if a given response data
     * represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler/rule.xml

    		</property>
    		<postConstruct name="addRule">
    			<arg>"url"</arg>
    			<arg>".*sitemap.*"</arg>
    		</postConstruct>
    	</component>
    
    	<component name="fileRule" class="org.codelibs.fess.crawler.rule.impl.RegexRule">
    		<property name="ruleId">"fileRule"</property>
    		<property name="defaultRule">true</property>
    		<property name="responseProcessor">
    			<component
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 1.5K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                        processor.setSuccessfulHttpCodes(new int[] { 200 });
                        processor.setNotModifiedHttpCodes(new int[] { 304 });
                    })//
                    .<RegexRule> singleton("fileRule", RegexRule.class, rule -> {
                        rule.setRuleId("fileRule");
                        rule.setDefaultRule(true);
                        rule.setResponseProcessor(container.getComponent("defaultResponseProcessor"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
Back to top