- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 172 for crawled (0.27 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
* * <p>Example usage: * <pre> * Crawler crawler = new Crawler(); * crawler.addUrl("http://example.com/"); * crawler.execute(); * crawler.close(); * </pre> */ public class Crawler implements Runnable, AutoCloseable { private static final Logger logger = LogManager.getLogger(Crawler.class); /** * Service for managing URL queues during crawling. */
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 17K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/job/CrawlJob.java
* This job launches a separate crawler process that can crawl web sites, file systems, * and data sources based on the configured crawling settings. * * <p>The job supports selective crawling by specifying configuration IDs for different * types of crawlers (web, file, data). It manages the crawler process lifecycle, * handles timeout scenarios, and ensures proper cleanup of resources.</p> *
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 19.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/indexer/IndexUpdater.java
import org.codelibs.fess.Constants; import org.codelibs.fess.crawler.Crawler; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.AccessResultData; import org.codelibs.fess.crawler.entity.OpenSearchAccessResult; import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue; import org.codelibs.fess.crawler.service.DataService; import org.codelibs.fess.crawler.service.UrlFilterService;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 32.9K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/general/EditForm.java
// Default constructor } /** * Enable or disable incremental crawling. * When enabled, only new or modified documents are crawled. */ @Size(max = 10) public String incrementalCrawling; /** * Number of days to keep crawled documents before cleanup. * Set to -1 to disable automatic cleanup. */ @Required @Min(-1) @Max(1000) @ValidateTypeFailure
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Sat Dec 13 02:21:17 UTC 2025 - 10.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImpl.java
import org.codelibs.fess.Constants; import org.codelibs.fess.crawler.builder.RequestDataBuilder; import org.codelibs.fess.crawler.client.CrawlerClient; import org.codelibs.fess.crawler.client.CrawlerClientFactory; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.ChildUrlsException; import org.codelibs.fess.crawler.exception.CrawlerSystemException;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 29.7K bytes - Viewed (3) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.util; import org.codelibs.fess.crawler.CrawlerContext; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.service.DataService; import org.codelibs.fess.crawler.service.UrlQueueService; /**
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Nov 22 13:28:22 UTC 2025 - 6.4K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/DataIndexHelper.java
/** * Interval in milliseconds between crawler thread executions. * Used to control the rate at which new crawler threads are started * and the frequency of status checks. */ protected long crawlingExecutionInterval = Constants.DEFAULT_CRAWLING_EXECUTION_INTERVAL; /** * Thread priority for crawler threads. * Defaults to normal thread priority. */
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 19K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java
import org.codelibs.fess.app.service.FailureUrlService; import org.codelibs.fess.crawler.builder.RequestDataBuilder; import org.codelibs.fess.crawler.client.CrawlerClient; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.log.LogType; import org.codelibs.fess.exception.ContainerNotAvailableException;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Dec 11 09:47:03 UTC 2025 - 19.5K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/util/PrunedTag.java
* This class defines tag patterns that match HTML elements based on tag name, CSS class, ID, or custom attributes. * It is used to identify and remove unwanted HTML elements from crawled documents. */ public class PrunedTag { /** The HTML tag name to match (e.g., "div", "span", "p") */ private final String tag; /** The ID attribute value to match */ private String id;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Mon Nov 24 04:23:08 UTC 2025 - 7.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/FessTransformer.java
import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.Constants; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.AccessResultData; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.util.CrawlingParameterUtil; import org.codelibs.fess.crawler.util.FieldConfigs; import org.codelibs.fess.mylasta.direction.FessConfig;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Dec 11 09:47:03 UTC 2025 - 14.1K bytes - Viewed (0)