- Sort Score
- Num 10 results
- Language All
Results 51 - 60 of 125 for crawling (0.04 seconds)
-
src/main/java/org/codelibs/fess/crawler/interval/FessIntervalController.java
import org.codelibs.fess.util.ComponentUtil; /** * FessIntervalController extends DefaultIntervalController to provide * Fess-specific interval control functionality for web crawling operations. * This controller manages delays and timing for various crawling states * including processing delays, queue waiting times, and new URL discovery. */ public class FessIntervalController extends DefaultIntervalController {
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Wed Nov 19 07:09:17 GMT 2025 - 5.1K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/app/service/RequestHeaderService.java
import org.dbflute.optional.OptionalEntity; import jakarta.annotation.Resource; /** * Service class for managing request headers used in web crawling configurations. * This service provides CRUD operations for request headers that are applied * during web crawling to configure HTTP request behavior. * */ public class RequestHeaderService { /** * Behavior for request header database operations. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 5.2K bytes - Click Count (0) -
README.md
You can register crawling targets in the Admin UI on the (Web, File, Data Store) crawler configuration pages, and then start the Crawler manually on the [Scheduler page](https://fess.codelibs.org/15.5/admin/scheduler-guide.html). ## Migration from another search provider Please see [MIGRATION.md](MIGRATION.md). ## Data Store
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Sat Feb 14 03:19:23 GMT 2026 - 7.8K bytes - Click Count (2) -
src/main/java/org/codelibs/fess/helper/ProtocolHelper.java
import org.codelibs.fess.mylasta.direction.FessConfig; import org.codelibs.fess.util.ComponentUtil; import jakarta.annotation.PostConstruct; /** * Helper class for managing and validating URL protocols in Fess crawling system. * This class handles the initialization and validation of web and file protocols * used by the crawler to determine which URLs can be crawled. */ public class ProtocolHelper {
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Mar 26 13:59:25 GMT 2026 - 12.4K bytes - Click Count (1) -
src/main/java/org/codelibs/fess/app/web/admin/duplicatehost/CreateForm.java
import jakarta.validation.constraints.Size; /** * Form class for creating new duplicate host configuration entries. * This form handles the creation of duplicate host mappings that redirect * crawling from duplicate hostnames to the regular canonical hostname. */ public class CreateForm { /** * Creates a new CreateForm instance. */ public CreateForm() { }
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 2.5K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/app/web/admin/duplicatehost/EditForm.java
* including tracking information for optimistic locking and audit trails. * Duplicate hosts are used to define which domains should be treated as the same site for crawling purposes. * */ public class EditForm extends CreateForm { /** * Creates a new EditForm instance. */ public EditForm() { super(); } /**
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 2.4K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/app/service/WebConfigService.java
import org.dbflute.optional.OptionalEntity; import jakarta.annotation.Resource; /** * Service class for managing web crawling configurations. * Provides CRUD operations for web configuration settings including * listing, retrieving, storing, and deleting web crawling configurations. */ public class WebConfigService extends FessAppService { /** * Default constructor. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 6.6K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/app/web/admin/scheduler/CreateForm.java
/** * The script data or code for the scheduled job. */ @CustomSize(maxKey = "form.admin.max.input.size") public String scriptData; /** * Whether this job is related to crawling. */ public String crawler; /** * Whether job logging is enabled. */ public String jobLogging; /** * Whether the scheduled job is available/enabled. */
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 3.2K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java
* This processor extends DefaultResponseProcessor to provide additional * processing capabilities through the ingest framework, allowing for * custom data transformation and enrichment during the crawling process. * * <p>It supports pluggable ingesters that can modify the result data * before it is stored in the search index.</p> */ public class FessResponseProcessor extends DefaultResponseProcessor { /**
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Jul 17 08:28:31 GMT 2025 - 3.7K bytes - Click Count (0) -
src/main/java/org/codelibs/fess/app/web/api/admin/fileconfig/ApiAdminFileconfigAction.java
import jakarta.annotation.Resource; /** * API action for admin file configuration management. * Provides RESTful API endpoints for managing file crawling configuration settings in the Fess search engine. * File configurations define settings for crawling file systems, FTP servers, and other file-based data sources. * */ public class ApiAdminFileconfigAction extends FessApiAdminAction {
Created: Tue Mar 31 13:07:34 GMT 2026 - Last Modified: Thu Aug 07 03:06:29 GMT 2025 - 9.2K bytes - Click Count (0)