- Sort Score
- Result 10 results
- Languages All
Results 71 - 80 of 530 for crawlen (0.23 sec)
-
src/main/java/org/codelibs/fess/util/GsaConfigParser.java
factory.setFeature(org.codelibs.fess.crawler.Constants.FEATURE_EXTERNAL_GENERAL_ENTITIES, false); factory.setFeature(org.codelibs.fess.crawler.Constants.FEATURE_EXTERNAL_PARAMETER_ENTITIES, false); final SAXParser parser = factory.newSAXParser(); parser.setProperty(XMLConstants.ACCESS_EXTERNAL_DTD, StringUtil.EMPTY); parser.setProperty(XMLConstants.ACCESS_EXTERNAL_SCHEMA, StringUtil.EMPTY);
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 21.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/MaxLengthExceededException.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; /** * MaxLengthExceededException is thrown when the content length exceeds the maximum allowed length. * It extends CrawlingAccessException, indicating a crawling-related access issue. * */ public class MaxLengthExceededException extends CrawlingAccessException {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java
import java.util.concurrent.atomic.AtomicInteger; import org.codelibs.core.collection.LruHashSet; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.filter.UrlFilter; import org.codelibs.fess.crawler.interval.IntervalController; import org.codelibs.fess.crawler.rule.Rule; import org.codelibs.fess.crawler.rule.RuleManager; import org.dbflute.utflute.core.PlainTestCase; /** * Test class for CrawlerContext.
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/RobotsTxtException.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.exception; /** * RobotsTxtException is an exception class that represents an error related to robots.txt processing during web crawling. * It extends CrawlerSystemException and provides constructors to create instances with a message and/or a cause. * */
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlQueueService.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.service; import java.util.List; import org.codelibs.fess.crawler.entity.UrlQueue; /** * Service interface for managing URL queues. * Provides methods for adding, retrieving, and managing URLs within a crawling session. * * @param <QUEUE> the type of URL queue */
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java
import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.builder.RequestDataBuilder; import org.codelibs.fess.crawler.client.AbstractCrawlerClient; import org.codelibs.fess.crawler.client.AccessTimeoutTarget; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.exception.ChildUrlsException;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 15.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java
/** The key of the configuration. e.g. u002eu06d4u2e3cu3002 */ String CRAWLER_DOCUMENT_FULLSTOP_CHARS = "crawler.document.fullstop.chars"; /** The key of the configuration. e.g. UTF-8 */ String CRAWLER_CRAWLING_DATA_ENCODING = "crawler.crawling.data.encoding"; /** The key of the configuration. e.g. http,https */ String CRAWLER_WEB_PROTOCOLS = "crawler.web.protocols";
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Sat Dec 13 02:21:17 UTC 2025 - 525.7K bytes - Viewed (2) -
src/main/java/org/codelibs/fess/app/web/api/admin/webconfig/SearchBody.java
/** * Search request body for web crawling configuration administration API. */ public class SearchBody extends BaseSearchBody { /** * Default constructor. */ public SearchBody() { super(); } /** Name of the web crawling configuration */ public String name; /** URLs to crawl */ public String urls;
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 1.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ExtractData.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.entity; import java.io.Serializable; import java.util.HashMap; import java.util.Map; import java.util.Set; import org.apache.tika.metadata.ClimateForcast; import org.apache.tika.metadata.CreativeCommons;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 3.8K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/scheduler/CreateForm.java
* The script data or code for the scheduled job. */ @CustomSize(maxKey = "form.admin.max.input.size") public String scriptData; /** * Whether this job is related to crawling. */ public String crawler; /** * Whether job logging is enabled. */ public String jobLogging; /** * Whether the scheduled job is available/enabled. */
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 3.2K bytes - Viewed (0)