- Sort Score
- Result 10 results
- Languages All
Results 51 - 60 of 441 for CRAWLER (4.98 sec)
-
src/main/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImpl.java
import org.codelibs.fess.Constants; import org.codelibs.fess.crawler.builder.RequestDataBuilder; import org.codelibs.fess.crawler.client.CrawlerClient; import org.codelibs.fess.crawler.client.CrawlerClientFactory; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.ChildUrlsException; import org.codelibs.fess.crawler.exception.CrawlerSystemException;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 29.7K bytes - Viewed (3) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java
*/ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import java.util.Map; import org.apache.poi.hpbf.extractor.PublisherTextExtractor; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Gets a text from . file.
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java
import org.codelibs.core.lang.SystemUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.CrawlerContext; import org.codelibs.fess.crawler.container.CrawlerContainer; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.entity.UrlQueue;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 12.5K bytes - Viewed (0) -
MIGRATION.md
-F "file=@documents.bulk" ``` ### 4. Direct Crawler Configuration Instead of importing documents, configure Fess to crawl your data sources: **Web Crawling**: - **Admin Path**: Crawler > Web - **Supports**: HTTP/HTTPS websites - **Features**: JavaScript rendering, authentication, custom headers **File Crawling**: - **Admin Path**: Crawler > File - **Supports**: SMB, FTP, local file systems
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Nov 06 12:40:11 UTC 2025 - 23.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.interval; /** * The {@code IntervalController} interface defines methods for controlling * the delay intervals in a web crawler. It includes constants representing * different types of processing states and a method to introduce a delay * based on the type of processing. * <p>
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/container/CrawlerContainer.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.container; import org.codelibs.core.lang.StringUtil; /** * The CrawlerContainer interface provides methods for managing components * within a crawler container. It includes methods to retrieve components, * check availability, and destroy the container. Additionally, it provides
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueueImpl.java
return id; } /* * (non-Javadoc) * * @see org.codelibs.fess.crawler.entity.UrlQueue#setId(IDTYPE) */ @Override public void setId(final IDTYPE id) { this.id = id; } /* * (non-Javadoc) * * @see org.codelibs.fess.crawler.entity.UrlQueue#getSessionId() */ @Override public String getSessionId() {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 6.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerThreadTest.java
import org.codelibs.fess.crawler.filter.UrlFilter; import org.codelibs.fess.crawler.helper.LogHelper; import org.codelibs.fess.crawler.interval.IntervalController; import org.codelibs.fess.crawler.processor.ResponseProcessor; import org.codelibs.fess.crawler.rule.Rule; import org.codelibs.fess.crawler.rule.RuleManager; import org.codelibs.fess.crawler.service.DataService; import org.codelibs.fess.crawler.service.UrlQueueService;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 18.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/CrawlerLoginFailureException.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; /** * The crawler login failure exception. * This exception is thrown when the crawler fails to login to a website. * */ public class CrawlerLoginFailureException extends CrawlerSystemException { private static final long serialVersionUID = 1L;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
import org.codelibs.fess.crawler.container.StandardCrawlerContainer; import org.codelibs.fess.crawler.entity.AccessResultImpl; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.entity.UrlQueueImpl; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.extractor.impl.TikaExtractor; import org.codelibs.fess.crawler.filter.impl.UrlFilterImpl;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Tue Nov 11 13:40:14 UTC 2025 - 25.8K bytes - Viewed (0)