Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 5 of 5 for storeChildUrls (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

                    if (crawlerContext.getMaxDepth() < 0 || depth <= crawlerContext.getMaxDepth()) {
                        // add and filter urls
                        storeChildUrls(crawlerContext, resultData.getChildUrlSet(), urlQueue.getUrl(), depth, resultData.getEncoding());
                    }
                } else if (crawlerContext.getMaxDepth() < 0 || urlQueue.getDepth() <= crawlerContext.getMaxDepth()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

     *   <li>Processing the response using a {@link ResponseProcessor} associated with a {@link Rule}.</li>
     *   <li>Extracting child URLs and adding them to the queue using {@link #storeChildUrls(Set, String, int)}
     *       or {@link #storeChildUrl(String, String, float, int)}.</li>
     *   <li>Handling exceptions that may occur during the crawling process.</li>
     * </ol>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

            try {
                // data
                storeData(responseData, resultData);
    
                if (isHtml(responseData) && !responseData.isNoFollow()) {
                    // urls
                    storeChildUrls(responseData, resultData);
                }
            } finally {
                xpathAPI.remove();
            }
    
            final Object redirectUrlObj = responseData.getMetaDataMap().get(LOCATION_HEADER);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

         */
        protected void storeChildUrlsToQueue(final UrlQueue<?> urlQueue, final Set<RequestData> childUrlSet) {
            if (childUrlSet != null) {
                // add an url
                try {
                    storeChildUrls(childUrlSet.stream().filter(rd -> StringUtil.isNotBlank(rd.getUrl())).collect(Collectors.toSet()),
                            urlQueue.getUrl(), urlQueue.getDepth() != null ? urlQueue.getDepth() + 1 : 1);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

                    }
                    if (noindex) {
                        logger.info("META(robots=noindex): {}", responseData.getUrl());
                        storeChildUrls(responseData, resultData);
                        throw new ChildUrlsException(resultData.getChildUrlSet(), "#processMetaRobots");
                    }
                    if (nofollow) {
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 54.4K bytes
    - Viewed (0)
Back to top