- Sort Score
- Result 10 results
- Languages All
Results 181 - 190 of 460 for Crawler (0.03 sec)
-
fess-crawler-lasta/src/main/resources/crawler/urlconverter.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <!-- Converts child links to normalize it. --> <component name="urlConvertHelper" class="org.codelibs.fess.crawler.helper.UrlConvertHelper"> </component>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 394 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/NullResponseProcessor.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.processor.impl; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.processor.ResponseProcessor; /** * NullResponseProcessor is a class that implements the ResponseProcessor interface.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.5K bytes - Viewed (0) -
src/main/resources/crawler/extractor+tikaExtractor.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <component name="tikaExtractor" class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor"> <property name="maxCompressionRatio">2</property> <property name="maxUncompressionSize">10000000</property> </component>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Sun Aug 25 12:46:12 UTC 2019 - 461 bytes - Viewed (0) -
src/main/java/org/codelibs/fess/Constants.java
public static final String CRAWLER_START_TIME = "CrawlerStartTime"; /** Info map key for crawler end time. */ public static final String CRAWLER_END_TIME = "CrawlerEndTime"; /** Info map key for crawler execution time. */ public static final String CRAWLER_EXEC_TIME = "CrawlerExecTime"; /** Info map key for web/file system crawler start time. */
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 34.6K bytes - Viewed (0) -
src/main/resources/crawler/contentlength.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/container.xml" /> <component name="contentLengthHelper" class="org.codelibs.fess.crawler.helper.ContentLengthHelper" instance="singleton"> <property name="defaultMaxLength">10485760</property><!-- 10M --> <postConstruct name="addMaxLength"> <arg>"text/html"</arg>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Sun Oct 11 06:51:14 UTC 2015 - 561 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import java.util.Map; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Extracts the filename from the parameters.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import java.util.Map; import org.apache.poi.hdgf.extractor.VisioTextExtractor; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Gets a text from a Visio (.vsd) file.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/Rule.java
*/ package org.codelibs.fess.crawler.rule; import java.io.Serializable; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.processor.ResponseProcessor; /** * The Rule interface defines the contract for implementing rules that can be applied to * response data in a web crawler. Implementations of this interface should provide logic
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.7K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/util/OpenSearchCrawlerConfig.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.util; /** * Configuration class for OpenSearch crawler settings. * This class provides configuration for index names, shards, and replicas * for the queue, data, and filter indices used by the crawler. */ public class OpenSearchCrawlerConfig { /** * Constructs a new OpenSearchCrawlerConfig. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java
import org.codelibs.core.lang.StringUtil; import org.codelibs.core.lang.ThreadUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExecutionTimeoutException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Extracts text content by executing an external command. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 16K bytes - Viewed (0)