- Sort Score
- Result 10 results
- Languages All
Results 41 - 50 of 524 for crawling (0.06 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java
import org.codelibs.fess.crawler.service.DataService; import org.codelibs.fess.crawler.service.UrlQueueService; /** * Utility class for managing crawling parameters using ThreadLocal variables. * This class provides methods to set and get various parameters related to the crawling process. * * <p>This class is final and cannot be instantiated.</p> * * <p>The following parameters are managed:</p> * <ul>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.4K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/crawlinginfo/AdminCrawlinginfoAction.java
import org.lastaflute.web.response.HtmlResponse; import org.lastaflute.web.response.render.RenderData; import org.lastaflute.web.ruts.process.ActionRuntime; import jakarta.annotation.Resource; /** * Admin action for Crawling Info management. * */ public class AdminCrawlinginfoAction extends FessAdminAction { /** * Default constructor. */ public AdminCrawlinginfoAction() { super(); }
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 11.4K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/DocumentHelper.java
} } /** * Processes a crawling request for a specific URL. * Executes the full crawling pipeline including client execution, rule processing, * transformation, and data extraction. * * @param crawlingConfig the crawling configuration to use * @param crawlingInfoId the crawling session ID * @param url the URL to process
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 17.2K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/util/GsaConfigParser.java
/** * Parser for Google Search Appliance (GSA) configuration files. * This SAX-based parser reads GSA XML configuration files and converts them into * Fess configuration objects including web crawling configurations, file crawling * configurations, and label types for access control. * * <p>The parser handles the following GSA configuration elements: * <ul> * <li>Collections with good/bad URL patterns</li>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 21.5K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java
* This class extends the base CrawlerThread and provides Fess-specific functionality for * crawling and indexing documents, including incremental crawling capabilities, content * modification checking, and integration with the Fess search engine backend. * * <p>Key features include:</p> * <ul> * <li>Incremental crawling support with last-modified timestamp checking</li> * <li>Document expiration handling</li>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 19.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/service/FailureUrlService.java
import org.dbflute.optional.OptionalEntity; import jakarta.annotation.Resource; /** * Service class for managing failure URLs that occur during web crawling. * Provides functionality to store, retrieve, and manage failed crawling attempts * with their associated error information. */ public class FailureUrlService { /** Logger instance for this class */
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 9.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RequestData.java
import java.util.Objects; import org.codelibs.fess.crawler.Constants; /** * Represents the data of a crawling request. * This class encapsulates the HTTP method, URL, and weight associated with a crawling request. */ public class RequestData { /** * HTTP methods supported for crawling requests. */ public enum Method { /** HTTP GET method. */ GET, /** HTTP POST method. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/EditBody.java
import org.codelibs.fess.app.web.admin.crawlinginfo.EditForm; /** * Request body class for crawling info edit operations in the admin REST API. * This class extends EditForm to inherit the necessary form validation and binding capabilities * for crawling information management operations. */ public class EditBody extends EditForm { /** * Default constructor. */
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 1.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/pager/FileConfigPager.java
/** Configuration name */ public String name; /** File system paths to crawl */ public String paths; /** Number of threads for crawling */ public String numOfThread; /** Interval time between crawling operations */ public String intervalTime; /** Boost value for search ranking */ public String boost; /** Availability status of the configuration */
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 7.3K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java
putResultDataBody(dataMap, fessConfig.getIndexFieldContent(), content); } } /** * Retrieves the crawling configuration for the given response data. * * @param responseData the response data from crawling * @return the crawling configuration */ protected CrawlingConfig getCrawlingConfig(final ResponseData responseData) {
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 54.4K bytes - Viewed (0)