- Sort Score
- Result 10 results
- Languages All
Results 231 - 240 of 460 for Crawler (0.12 sec)
-
src/main/java/org/codelibs/fess/app/web/admin/webconfig/CreateForm.java
* Document URL patterns to exclude from search index. */ @CustomSize(maxKey = "form.admin.max.input.size") public String excludedDocUrls; /** * Additional configuration parameters for the crawler. */ @CustomSize(maxKey = "form.admin.max.input.size") public String configParameter; /** * The maximum crawling depth from the starting URLs. */ @Min(value = 0)
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 5.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.extractor.Extractor; import org.codelibs.fess.crawler.util.TextUtil; import org.xml.sax.ContentHandler; import org.xml.sax.SAXException;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/pager/SchedulerPager.java
*/ public String cronExpression; /** * Script type of the scheduled job. */ public String scriptType; /** * Whether the scheduled job is a crawler job. */ public String crawler; /** * Whether logging is enabled for the scheduled job. */ public String jobLogging; /** * Whether the scheduled job is available. */
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 6.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/ContentLengthHelper.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.helper; import java.util.HashMap; import java.util.Map; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.exception.CrawlerSystemException; /** * Helper class for managing content length limits based on MIME types.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java
*/ package org.codelibs.fess.crawler.transformer.impl; import java.util.Map; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.builder.RequestDataBuilder; import org.codelibs.fess.crawler.entity.AccessResultDataImpl; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.CrawlerSystemException;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 13.8K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/opensearch/config/bsentity/dbmeta/ScheduledJobDbm.java
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 13.4K bytes - Viewed (0) -
fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataServiceTest.java
*/ package org.codelibs.fess.crawler.service.impl; import static org.codelibs.opensearch.runner.OpenSearchRunner.newConfigs; import java.util.ArrayList; import java.util.List; import java.util.UUID; import org.codelibs.fess.crawler.client.FesenClient; import org.codelibs.fess.crawler.entity.AccessResult; import org.codelibs.fess.crawler.entity.OpenSearchAccessResult;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java
import org.apache.logging.log4j.Logger; import org.codelibs.core.io.InputStreamUtil; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; /** * Abstract base class for XML extractors.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/DefaultIntervalController.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.interval.impl; import java.util.Map; import org.codelibs.core.lang.ThreadUtil; /** * Default implementation of the IntervalController. * This class provides a default way to manage delays between crawler operations. * It allows setting delays before processing, after processing, when no URLs are in the queue,
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlQueueService.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.service; import java.util.List; import org.codelibs.fess.crawler.entity.UrlQueue; /** * Service interface for managing URL queues. * Provides methods for adding, retrieving, and managing URLs within a crawling session. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.6K bytes - Viewed (0)