- Sort Score
- Result 10 results
- Languages All
Results 1 - 7 of 7 for getChildUrlSet (0.28 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java
final ResultData resultData = htmlTransformer.transform(responseData); assertEquals(content, new String(resultData.getData())); assertEquals(1, resultData.getChildUrlSet().size()); assertEquals("http://hoge/test2.html", resultData.getChildUrlSet().iterator().next().getUrl()); } public void test_transform_urllink() { String content = "<a href=\"http://fuga/test.html\">test</a>";
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 13.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java
} final int depth = urlQueue.getDepth() == null ? 1 : urlQueue.getDepth() + 1; if (crawlerContext.getMaxDepth() < 0 || depth <= crawlerContext.getMaxDepth()) { // add and filter urls storeChildUrls(crawlerContext, resultData.getChildUrlSet(), urlQueue.getUrl(), depth, resultData.getEncoding());
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 12.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResultData.java
this.transformerName = transformerName; } /** * Get the child URL set. * @return childUrlSet */ public Set<RequestData> getChildUrlSet() { return childUrlSet; } /** * Set the child URL set. * @param childUrlSet the set of request data to set as child URLs */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.7K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java
fessConfig.getIndexFieldClickCount(), fessConfig.getIndexFieldFavoriteCount() }); if (document == null) { storeChildUrlsToQueue(urlQueue, getChildUrlSet(searchEngineClient, id)); return true; } final Date expires = DocumentUtil.getValue(document, fessConfig.getIndexFieldExpires(), Date.class);
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResponseData.java
childUrlSet.remove(url); } /** * Gets the set of child URLs discovered from this response. * * @return the set of child URLs */ public Set<RequestData> getChildUrlSet() { return childUrlSet; } /** * Creates a RequestData object from this response's URL and method. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 11.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java
logger.info("META(robots=noindex): {}", responseData.getUrl()); storeChildUrls(responseData, resultData); throw new ChildUrlsException(resultData.getChildUrlSet(), "#processMetaRobots"); } if (nofollow) { logger.info("META(robots=nofollow): {}", responseData.getUrl()); responseData.setNoFollow(true);
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 54.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java
} requestDataList = convertChildUrlList(requestDataList); resultData.addAllUrl(requestDataList); }); resultData.addAllUrl(responseData.getChildUrlSet()); final RequestData requestData = responseData.getRequestData(); resultData.removeUrl(requestData); resultData.removeUrl(getDuplicateUrl(requestData));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 28.5K bytes - Viewed (0)