- Sort Score
- Result 10 results
- Languages All
Results 61 - 70 of 529 for crawlen (0.51 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/MemoryDataHelper.java
*/ package org.codelibs.fess.crawler.helper; import java.util.ArrayList; import java.util.HashMap; import java.util.LinkedList; import java.util.List; import java.util.Map; import java.util.Queue; import java.util.regex.Pattern; import org.codelibs.fess.crawler.entity.AccessResultImpl; import org.codelibs.fess.crawler.entity.UrlQueueImpl; /**
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/general/EditForm.java
* including crawling behavior, authentication, logging, and various system parameters. * */ public class EditForm { /** * Creates a new EditForm instance. */ public EditForm() { // Default constructor } /** * Enable or disable incremental crawling. * When enabled, only new or modified documents are crawled. */ @Size(max = 10)
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Sat Dec 13 02:21:17 UTC 2025 - 10.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/ingest/Ingester.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.ingest; import java.util.Map; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.entity.DataStoreParams; import org.codelibs.fess.util.ComponentUtil; /**
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 4.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/interval/FessIntervalController.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.interval; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.fess.crawler.interval.impl.DefaultIntervalController; import org.codelibs.fess.helper.IntervalControlHelper; import org.codelibs.fess.util.ComponentUtil; /**
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Wed Nov 19 07:09:17 UTC 2025 - 5.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/ProtocolHelper.java
import jakarta.annotation.PostConstruct; /** * Helper class for managing and validating URL protocols in Fess crawling system. * This class handles the initialization and validation of web and file protocols * used by the crawler to determine which URLs can be crawled. */ public class ProtocolHelper { private static final Logger logger = LogManager.getLogger(ProtocolHelper.class);
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Dec 12 13:58:40 UTC 2025 - 12.4K bytes - Viewed (1) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java
import java.util.concurrent.atomic.AtomicInteger; import org.codelibs.core.collection.LruHashSet; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.filter.UrlFilter; import org.codelibs.fess.crawler.interval.IntervalController; import org.codelibs.fess.crawler.rule.Rule; import org.codelibs.fess.crawler.rule.RuleManager; import org.dbflute.utflute.core.PlainTestCase; /** * Test class for CrawlerContext.
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java
import org.codelibs.core.lang.SystemUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.CrawlerContext; import org.codelibs.fess.crawler.container.CrawlerContainer; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.entity.UrlQueue;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 12.5K bytes - Viewed (0) -
src/main/resources/fess_config.properties
# Encoding for crawling data. crawler.crawling.data.encoding=UTF-8 # Supported web protocols for crawling. crawler.web.protocols=http,https # Supported file protocols for crawling. crawler.file.protocols=file,smb,smb1,ftp,storage,s3,gcs # Pattern for environment variable keys in crawling data. crawler.data.env.param.key.pattern=^FESS_ENV_.* # Whether to ignore robots.txt during crawling. crawler.ignore.robots.txt=false
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Dec 11 09:47:03 UTC 2025 - 54.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/FileTransformer.java
import org.codelibs.core.io.CopyUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.AccessResultData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; /** * <p> * FileTransformer stores the content of a crawled resource as a file on the file system.
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 11.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/RobotsTxtException.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; /** * RobotsTxtException is an exception class that represents an error related to robots.txt processing during web crawling. * It extends CrawlerSystemException and provides constructors to create instances with a message and/or a cause. * */
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.5K bytes - Viewed (0)