- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 197 for Crawled (0.03 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/UrlFilter.java
/** * Add an url pattern as a target. * * @param urlPattern Regular expression that is crawled */ void addInclude(String urlPattern); /** * Add an url pattern as a non-target. * * @param urlPattern Regular expression that is not crawled */ void addExclude(String urlPattern); /** * Process an url when it's added as a seed url. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
import org.codelibs.fess.crawler.entity.Sitemap; import org.codelibs.fess.crawler.entity.SitemapSet; import org.codelibs.fess.crawler.exception.ChildUrlsException; import org.codelibs.fess.crawler.helper.SitemapsHelper; import org.codelibs.fess.crawler.processor.ResponseProcessor; import jakarta.annotation.Resource; /** * A response processor implementation that handles sitemaps.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ExtractException.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; /** * Exception thrown during the extraction process in the crawler. * This exception indicates a failure or error that occurred while extracting content from a crawled resource. * It extends {@link org.codelibs.fess.crawler.exception.CrawlerSystemException} and provides constructors
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ExtractData.java
import org.apache.tika.metadata.Message; import org.apache.tika.metadata.TIFF; import org.apache.tika.metadata.TikaCoreProperties; import org.apache.tika.metadata.TikaMimeKeys; /** * Represents extracted data from a crawled resource, including content and metadata. */ public class ExtractData implements TikaCoreProperties, CreativeCommons, Geographic, HttpHeaders, Message, ClimateForcast, TIFF, TikaMimeKeys, Serializable {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 3.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueueImpl.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.entity; /** * Implementation of the {@link UrlQueue} interface. * This class represents a URL to be crawled, storing its ID, session ID, * HTTP method, URL, metadata, encoding, parent URL, depth, last modified time, * creation time, and weight. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 6.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.util; import org.codelibs.fess.crawler.CrawlerContext; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.service.DataService; import org.codelibs.fess.crawler.service.UrlQueueService; /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlQueueServiceImpl.java
import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.entity.UrlQueueImpl; import org.codelibs.fess.crawler.helper.MemoryDataHelper; import org.codelibs.fess.crawler.service.UrlQueueService; import jakarta.annotation.Resource; /** * Implementation of the {@link UrlQueueService} interface. * This class provides methods for managing a queue of URLs to be crawled,
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.3K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler.xml
<components namespace="fessCrawler"> <include path="crawler/container.xml"/> <include path="crawler/client.xml"/> <include path="crawler/rule.xml"/> <include path="crawler/filter.xml"/> <include path="crawler/interval.xml"/> <include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Tue Nov 28 13:40:25 UTC 2017 - 1.7K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml
<components namespace="fessCrawler"> <include path="crawler/container.xml"/> <include path="crawler/client.xml"/> <include path="crawler/rule.xml"/> <include path="crawler/filter.xml"/> <include path="crawler/interval.xml"/> <include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Nov 07 04:44:10 UTC 2024 - 2.2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/TextTransformerTest.java
*/ package org.codelibs.fess.crawler.transformer.impl; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.container.StandardCrawlerContainer; import org.codelibs.fess.crawler.entity.AccessResultDataImpl; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.CrawlerSystemException;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 4.6K bytes - Viewed (0)