- Sort Score
- Result 10 results
- Languages All
Results 1 - 3 of 3 for href (0.01 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java
} return parser; } /** * Gets the base href from the document's BASE tag. * * @param document the document to extract base href from * @return the base href URL, or null if not found */ protected String getBaseHref(final Document document) { try {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 28.5K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
final Map<String, String> childUrlRuleMap = newHashMap(); childUrlRuleMap.put("//A", "href"); childUrlRuleMap.put("//AREA", "href"); childUrlRuleMap.put("//FRAME", "src"); childUrlRuleMap.put("//IFRAME", "src"); childUrlRuleMap.put("//IMG", "src"); childUrlRuleMap.put("//LINK", "href"); childUrlRuleMap.put("//SCRIPT", "src"); container = new StandardCrawlerContainer();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java
import org.codelibs.fess.crawler.entity.RobotsTxt.Directive; import org.codelibs.fess.crawler.exception.RobotsTxtException; /** * Robots.txt Specifications: * <ul> * <li><a href= * "https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt" * >https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt * </a></li> * </ul> * * @author bowez
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 7.7K bytes - Viewed (0)