Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 1 of 1 for getRobotsTxtUrlSet (1.99 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

            } else {
                hostUrl = url;
            }
            final String robotTxtUrl = hostUrl + "/robots.txt";
    
            // check url
            if (crawlerContext.getRobotsTxtUrlSet().contains(robotTxtUrl)) {
                if (logger.isDebugEnabled()) {
                    logger.debug("{} is already visited.", robotTxtUrl);
                }
                return;
            }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
Back to top