Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 6 of 6 for RobotsTxtHelper (0.13 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

        /** Whether robots.txt processing is enabled. */
        protected boolean enabled = true;
    
        /**
         * Creates a new RobotsTxtHelper instance.
         */
        public RobotsTxtHelper() {
            // Default constructor
        }
    
        /**
         * Parses a robots.txt file from the given input stream using UTF-8 encoding.
         * @param stream the input stream to parse
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

    public class RobotsTxtHelperTest extends PlainTestCase {
        public RobotsTxtHelper robotsTxtHelper;
    
        @Override
        protected void setUp() throws Exception {
            super.setUp();
            StandardCrawlerContainer container = new StandardCrawlerContainer().singleton("robotsTxtHelper", RobotsTxtHelper.class);
            robotsTxtHelper = container.getComponent("robotsTxtHelper");
        }
    
        public void testParse() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  3. fess-crawler-lasta/src/main/resources/crawler/robotstxt.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="robotsTxtHelper" class="org.codelibs.fess.crawler.helper.RobotsTxtHelper"
    		instance="prototype">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 367 bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

                    .singleton("urlFilterService", UrlFilterServiceImpl.class)//
                    .singleton("urlFilter", UrlFilterImpl.class)//
                    .singleton("robotsTxtHelper", RobotsTxtHelper.class)//
                    .singleton("httpClient", HcHttpClient.class);
            httpClient = container.getComponent("httpClient");
            urlFilter = container.getComponent("urlFilter");
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

        /** Logger instance for this class */
        private static final Logger logger = LogManager.getLogger(HcHttpClient.class);
    
        /** Helper for processing robots.txt files */
        @Resource
        protected RobotsTxtHelper robotsTxtHelper;
    
        /** Helper for managing content length limits */
        @Resource
        protected ContentLengthHelper contentLengthHelper;
    
        /** Helper for determining MIME types */
        @Resource
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                        transformer.setChildUrlRuleMap(childUrlRuleMap);
                    })
                    .singleton("dataHelper", MemoryDataHelper.class)
                    .singleton("robotsTxtHelper", RobotsTxtHelper.class)
                    .<CrawlerClientFactory> singleton("clientFactory", CrawlerClientFactory.class, factory -> {
                        factory.addClient("http:.*", container.getComponent("httpClient"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
Back to top