Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 1 - 3 of 3 for getRobotsTxtUrlSet (0.13 seconds)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

            this.intervalController = intervalController;
        }
    
        /**
         * Returns the set of robots.txt URLs.
         * @return The set of robots.txt URLs.
         */
        public Set<String> getRobotsTxtUrlSet() {
            return robotsTxtUrlSet;
        }
    
        /**
         * Sets the set of robots.txt URLs.
         * @param robotsTxtUrlSet The set of robots.txt URLs.
         */
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Wed Dec 31 09:07:38 GMT 2025
    - 9K bytes
    - Click Count (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/Hc4HttpClient.java

            } else {
                hostUrl = url;
            }
            final String robotTxtUrl = hostUrl + "/robots.txt";
    
            // check url
            if (crawlerContext.getRobotsTxtUrlSet().contains(robotTxtUrl)) {
                if (logger.isDebugEnabled()) {
                    logger.debug("{} is already visited.", robotTxtUrl);
                }
                return;
            }
    
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Fri Jan 09 23:46:52 GMT 2026
    - 54.4K bytes
    - Click Count (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/Hc5HttpClient.java

            } else {
                hostUrl = url;
            }
            final String robotTxtUrl = hostUrl + "/robots.txt";
    
            // check url
            if (crawlerContext.getRobotsTxtUrlSet().contains(robotTxtUrl)) {
                if (logger.isDebugEnabled()) {
                    logger.debug("{} is already visited.", robotTxtUrl);
                }
                return;
            }
    
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Sat Jan 31 12:23:29 GMT 2026
    - 62.2K bytes
    - Click Count (0)
Back to Top