- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 167 for Crawling (0.83 sec)
-
src/main/resources/fess_label_en.properties
labels.createdTime=Created Time labels.depth=Depth labels.excludedPaths=Excluded Paths for Crawling labels.excludedUrls=Excluded URLs for Crawling labels.excludedDocPaths=Excluded Paths for Searching labels.excludedDocUrls=Excluded URLs for Searching labels.hostname=Hostname labels.id=ID labels.includedPaths=Included Paths for Crawling labels.includedUrls=Included URLs for Crawling labels.includedDocPaths=Included Paths for Searching
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Sat Dec 13 02:21:17 UTC 2025 - 44K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/ApiAdminCrawlinginfoAction.java
.status(ApiResult.Status.OK) .result()); } /** * Retrieves a specific crawling info log by ID. * * @param id the ID of the crawling info log to retrieve * @return JSON response containing the crawling info log data */ // GET /api/admin/crawlinginfo/log/{id} @Execute public JsonResponse<ApiResult> get$log(final String id) {
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 6.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/SearchBody.java
import org.codelibs.fess.app.web.api.admin.BaseSearchBody; /** * Search request body for crawling information administration. * Extends BaseSearchBody with crawling information-specific search parameters. */ public class SearchBody extends BaseSearchBody { /** The crawling session ID to search for. */ public String sessionId; /** * Default constructor for SearchBody. */
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 1.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/api/admin/webconfig/SearchBody.java
import org.codelibs.fess.app.web.api.admin.BaseSearchBody; /** * Search request body for web crawling configuration administration API. */ public class SearchBody extends BaseSearchBody { /** * Default constructor. */ public SearchBody() { super(); } /** Name of the web crawling configuration */ public String name; /** URLs to crawl */ public String urls;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 1.2K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/SearchForm.java
*/ package org.codelibs.fess.app.web.admin.crawlinginfo; /** * The search form for Crawling Info. */ public class SearchForm { /** * Default constructor for SearchForm. */ public SearchForm() { } /** * The session ID field for searching crawling information. */ public String sessionId;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 952 bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/general/EditForm.java
@Size(max = 10) public String thumbnail; /** * Types of crawling failures to ignore during crawling operations. * Specified failure types will not be logged or counted as errors. */ @Size(max = 1000) public String ignoreFailureType; /** * Threshold for failure count before stopping crawling of a URL. * Set to -1 to disable the threshold check. */ @Required
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Sat Dec 13 02:21:17 UTC 2025 - 10.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/job/CrawlJob.java
/** * The namespace identifier for the crawling session. * Used to organize and identify crawling activities in the system. * Defaults to the system crawling info name. */ protected String namespace = Constants.CRAWLING_INFO_SYSTEM_NAME; /** * Array of web crawling configuration IDs to process.
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 19.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/exec/Crawler.java
* <ul> * <li>Web crawling - crawls web sites and web content</li> * <li>File system crawling - crawls file systems and documents</li> * <li>Data store crawling - crawls databases and other data sources</li> * <li>Combined crawling - runs multiple crawling types simultaneously</li> * </ul> * * <p>Command line usage: * <pre> * java org.codelibs.fess.exec.Crawler [options...]
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 31.4K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/CrawlingConfigHelper.java
import com.google.common.cache.Cache; import com.google.common.cache.CacheBuilder; import jakarta.annotation.PostConstruct; /** * Helper class for managing crawling configurations. * Provides functionality to store, retrieve, and manage different types of crawling configurations * including web, file, and data configurations. Supports caching and session-based configuration management. */ public class CrawlingConfigHelper {
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 19.5K bytes - Viewed (1) -
CLAUDE.md
- Graceful degradation (e.g., robots.txt parsing continues on errors) --- ## Key Components ### Crawler (`Crawler.java`) Main orchestrator for crawling operations. **Key Methods**: ```java String execute() // Start crawling, return session ID void addUrl(String url) // Add URL to queue void cleanup(String sessionId) // Clean up session void stop() // Stop gracefully
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Fri Nov 28 17:31:34 UTC 2025 - 10.7K bytes - Viewed (0)