- Sort Score
- Result 10 results
- Languages All
Results 181 - 190 of 460 for Crawler (0.16 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import java.util.Map; import org.apache.poi.hdgf.extractor.VisioTextExtractor; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Gets a text from . file.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/Rule.java
*/ package org.codelibs.fess.crawler.rule; import java.io.Serializable; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.processor.ResponseProcessor; /** * The Rule interface defines the contract for implementing rules that can be applied to * response data in a web crawler. Implementations of this interface should provide logic
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.7K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler/urlconverter.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <!-- Converts child links to normalize it. --> <component name="urlConvertHelper" class="org.codelibs.fess.crawler.helper.UrlConvertHelper"> </component>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 394 bytes - Viewed (0) -
src/main/java/org/codelibs/fess/opensearch/config/exentity/WebConfig.java
import org.codelibs.fess.app.service.RequestHeaderService; import org.codelibs.fess.app.service.WebAuthenticationService; import org.codelibs.fess.crawler.client.CrawlerClientFactory; import org.codelibs.fess.crawler.client.http.Authentication; import org.codelibs.fess.crawler.client.http.HcHttpClient; import org.codelibs.fess.helper.SystemHelper; import org.codelibs.fess.mylasta.direction.FessConfig;
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Sat Mar 15 06:53:53 UTC 2025 - 9.9K bytes - Viewed (0) -
src/main/resources/crawler/extractor+tikaExtractor.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <component name="tikaExtractor" class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor"> <property name="maxCompressionRatio">2</property> <property name="maxUncompressionSize">10000000</property> </component>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Sun Aug 25 12:46:12 UTC 2019 - 461 bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/util/OpenSearchCrawlerConfig.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.util; /** * Configuration class for OpenSearch crawler settings. * This class provides configuration for index names, shards, and replicas * for the queue, data, and filter indices used by the crawler. */ public class OpenSearchCrawlerConfig { /** * Constructs a new OpenSearchCrawlerConfig. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5.4K bytes - Viewed (0) -
fess-crawler/pom.xml
<modelVersion>4.0.0</modelVersion> <artifactId>fess-crawler</artifactId> <packaging>jar</packaging> <name>Fess Crawler</name> <description>Fess Crawler is a crawler framework.</description> <parent> <groupId>org.codelibs.fess</groupId> <artifactId>fess-crawler-parent</artifactId> <version>15.3.0-SNAPSHOT</version> <relativePath>../pom.xml</relativePath> </parent>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 11.3K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/PermissionHelper.java
import org.apache.logging.log4j.Logger; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.client.fs.FileSystemClient; import org.codelibs.fess.crawler.client.ftp.FtpClient; import org.codelibs.fess.crawler.client.smb.SmbClient; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.exception.CrawlingAccessException; import org.codelibs.fess.mylasta.direction.FessConfig;
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 15.3K bytes - Viewed (0) -
src/main/resources/crawler/contentlength.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <component name="contentLengthHelper" class="org.codelibs.fess.crawler.helper.ContentLengthHelper" instance="singleton"> <property name="defaultMaxLength">10485760</property><!-- 10M --> <postConstruct name="addMaxLength"> <arg>"text/html"</arg>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Sun Oct 11 06:51:14 UTC 2015 - 561 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java
import java.util.regex.Pattern; import javax.xml.xpath.XPathNodes; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.util.XPathAPI; import org.codelibs.nekohtml.parsers.DOMParser; import org.w3c.dom.Document; import org.w3c.dom.Node;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0)