- Sort: Score
- Results per page: 10
- Languages: All
Results 81 - 90 of 460 for Crawler (0.7 sec)
-
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java
*/ package org.codelibs.fess.crawler.service.impl; import java.util.List; import java.util.Map; import java.util.function.Consumer; import org.apache.lucene.search.TotalHits; import org.codelibs.core.beans.util.BeanUtil; import org.codelibs.fess.crawler.entity.OpenSearchAccessResult; import org.codelibs.fess.crawler.entity.OpenSearchAccessResultData; import org.codelibs.fess.crawler.exception.OpenSearchAccessException;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 10.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java
import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.extractor.Extractor; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.MimeTypeHelper; import jakarta.mail.Address; import jakarta.mail.BodyPart;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/Transformer.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.transformer; import org.codelibs.fess.crawler.entity.AccessResultData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; /** * The Transformer interface defines methods for transforming response data
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TarExtractorTest.java
import org.codelibs.core.io.ResourceUtil; import org.codelibs.fess.crawler.container.StandardCrawlerContainer; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.MaxLengthExceededException; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.impl.MimeTypeHelperImpl; import org.dbflute.utflute.core.PlainTestCase; /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 3.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/AbstractRule.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.rule.impl; import org.codelibs.fess.crawler.container.CrawlerContainer; import org.codelibs.fess.crawler.processor.ResponseProcessor; import org.codelibs.fess.crawler.rule.Rule; import org.codelibs.fess.crawler.rule.RuleManager; import jakarta.annotation.Resource; /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 2.8K bytes - Viewed (0) -
fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt
User-agent: * Disallow: /private/ Disallow: /help # disallows /help.html, /help/index.html, etc. Allow: /help/faq.html Crawl-delay: 3 User-agent: Crawler Disallow: /aaa User-agent: Crawler/1.0 Disallow: /bbb User-agent: Crawler/2.0 Disallow: /ccc User-agent: Hoge Crawler Disallow: /ddd sitemap: http://www.example.com/sitmap.xml
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 566 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java
* <li>org.codelibs.fess.crawler.Constants</li> * <li>org.codelibs.fess.crawler.exception.CrawlerSystemException</li> * <li>org.codelibs.fess.crawler.entity.AccessResultData</li> * <li>org.codelibs.core.lang.StringUtil</li> * </ul> * * @see org.codelibs.fess.crawler.Constants * @see org.codelibs.fess.crawler.exception.CrawlerSystemException * @see org.codelibs.fess.crawler.entity.AccessResultData
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java
* Datetime format. * * By providing the last modification timestamp, you enable search engine * crawlers to retrieve only a subset of the Sitemaps in the index i.e. a * crawler may only retrieve Sitemaps that were modified since a certain * date. This incremental Sitemap fetching mechanism allows for the rapid * discovery of new URLs on very large sites.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.4K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/pool/CrawlerPooledObjectFactory.java
*/ package org.codelibs.fess.crawler.pool; import org.apache.commons.pool2.BasePooledObjectFactory; import org.apache.commons.pool2.PooledObject; import org.apache.commons.pool2.impl.DefaultPooledObject; import org.codelibs.fess.crawler.container.CrawlerContainer; import jakarta.annotation.Resource; /** * A factory for creating and managing pooled crawler objects.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/builder/RequestDataBuilder.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.builder; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.RequestData.Method; /** * Builder class for creating RequestData objects using a fluent interface.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.3K bytes - Viewed (0)