- Sort Score
- Result 10 results
- Languages All
Results 31 - 40 of 44 for Extract (0.04 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java
public class MsPublisherExtractor extends AbstractExtractor { /** * Creates a new MsPublisherExtractor instance. */ public MsPublisherExtractor() { super(); } /** * Extracts text from the Publisher input stream. * @param in The input stream. * @param params The parameters. * @return The extracted data. */ @Override
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.util.regex.Pattern; /** * Extracts text content from XML documents. */ public class XmlExtractor extends AbstractXmlExtractor { /** * Creates a new XmlExtractor instance. */ public XmlExtractor() { super(); }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java
import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Extracts text content from an input stream as plain text. */ public class TextExtractor extends AbstractExtractor { /** * The encoding for text. */ protected String encoding = Constants.UTF_8;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java
*/ public class MsVisioExtractor extends AbstractExtractor { /** * Creates a new MsVisioExtractor instance. */ public MsVisioExtractor() { super(); } /** * Extracts text from the Visio input stream. * @param in The input stream. * @param params The parameters. * @return The extracted data. */ @Override
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/BinaryTransformer.java
* into a ResultData object, and for retrieving the binary data from an AccessResultData object. * It extends the AbstractTransformer class. * * <p> * This transformer extracts the binary content from the response body of a web resource, * stores it as a byte array in the ResultData, and provides a method to retrieve this data * as a ByteArrayInputStream. * </p> * * <p>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java
* */ public class MsWordExtractor extends AbstractExtractor { /** * Creates a new MsWordExtractor instance. */ public MsWordExtractor() { super(); } /** * Extracts text from the Word input stream. * @param in The input stream. * @param params The parameters. * @return The extracted data. */ @Override
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java
*/ public class MsExcelExtractor extends AbstractExtractor { /** * Creates a new MsExcelExtractor instance. */ public MsExcelExtractor() { super(); } /** * Extracts text from the Excel input stream. * @param in The input stream. * @param params The parameters. * @return The extracted data. */ @Override
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java
super(params); } /** * Delays before processing a URL, ensuring that requests to the same host are not made too frequently. * This method extracts the host from the URL and enforces a delay based on the configured * delayMillisBeforeProcessing parameter. * * @throws InterruptedRuntimeException if the thread is interrupted during the delay
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java
* only one of them (allRequired = false). It also supports a default rule that always matches. * * <p> * The class uses a map of field names to Pattern objects to store the regular expressions. * The match method extracts the values of the specified fields from the ResponseData and * applies the corresponding regular expressions. * </p> * * <p> * Example usage: * </p> * * <pre> * {@code
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 6.2K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java
} catch (final Exception e) { throw new OpenSearchAccessException("response: " + response, e); } } return targetList; } /** * Extracts a field value from OpenSearch results and converts it to the specified type. * * @param <T> The target type. * @param field The field value from OpenSearch. * @param clazz The target class.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 10.9K bytes - Viewed (0)