- Sort: Score
- Result: 10 results
- Languages: All
Results 1 - 2 of 2 for HtmlExtractor (0.06 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java
import org.w3c.dom.Node; import org.xml.sax.InputSource; /** * Extracts text content from HTML documents. */ public class HtmlExtractor extends AbstractXmlExtractor { /** Logger for this class. */ protected static final Logger logger = LogManager.getLogger(HtmlExtractor.class); /** Pattern for extracting charset from meta tags. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.3K bytes - Viewed (0)
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractorTest.java
public HtmlExtractor htmlExtractor; @Override protected void setUp() throws Exception { super.setUp(); StandardCrawlerContainer container = new StandardCrawlerContainer().singleton("htmlExtractor", HtmlExtractor.class); htmlExtractor = container.getComponent("htmlExtractor"); htmlExtractor.addMetadata("title", "//TITLE"); }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 3.7K bytes - Viewed (0)