- Sort Score
- Result 10 results
- Languages All
Results 191 - 200 of 658 for crawler (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/Rule.java
*/ package org.codelibs.fess.crawler.rule; import java.io.Serializable; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.processor.ResponseProcessor; /** * The Rule interface defines the contract for implementing rules that can be applied to * response data in a web crawler. Implementations of this interface should provide logic
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; import java.util.Set; import org.codelibs.fess.crawler.entity.RequestData; /** * {@link ChildUrlsException} is thrown when child URLs are found during crawling.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ExecutionTimeoutException.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; /** * An exception indicating that the execution of a process has timed out. * This exception extends {@link org.codelibs.fess.crawler.exception.ExtractException}. * */ public class ExecutionTimeoutException extends ExtractException {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessorTest.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.processor.impl; import org.codelibs.fess.crawler.entity.ResponseData; import org.dbflute.utflute.core.PlainTestCase; /** * @author shinsuke * */ public class DefaultResponseProcessorTest extends PlainTestCase {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2.3K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/util/OpenSearchCrawlerConfig.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.util; /** * Configuration class for OpenSearch crawler settings. * This class provides configuration for index names, shards, and replicas * for the queue, data, and filter indices used by the crawler. */ public class OpenSearchCrawlerConfig { /** * Constructs a new OpenSearchCrawlerConfig. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java
import org.codelibs.core.lang.StringUtil; import org.codelibs.core.lang.ThreadUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExecutionTimeoutException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Extracts text content by executing an external command. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 16K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/ResponseProcessor.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.processor; import org.codelibs.fess.crawler.entity.ResponseData; /** * The ResponseProcessor interface defines a contract for processing response data. * Implementations of this interface are responsible for handling the response data
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java
import java.util.regex.Pattern; import javax.xml.xpath.XPathNodes; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.util.XPathAPI; import org.codelibs.nekohtml.parsers.DOMParser; import org.w3c.dom.Document; import org.w3c.dom.Node;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java
import org.codelibs.fess.Constants; import org.codelibs.fess.crawler.builder.RequestDataBuilder; import org.codelibs.fess.crawler.entity.AccessResultData; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.exception.ChildUrlsException;
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 54.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/UrlConvertHelper.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.helper; import java.util.LinkedHashMap; import java.util.Map; import org.codelibs.fess.crawler.exception.CrawlerSystemException; /** * Helper class for converting URLs based on a set of predefined rules. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.1K bytes - Viewed (0)