- Sort Score
- Result 10 results
- Languages All
Results 81 - 90 of 397 for Crawler (0.1 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java
import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.exception.ExtractException; import org.codelibs.fess.crawler.exception.MaxLengthExceededException; import org.codelibs.fess.crawler.extractor.Extractor; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.helper.MimeTypeHelper;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 4.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TextExtractorTest.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import org.codelibs.core.io.CloseableUtil; import org.codelibs.core.io.ResourceUtil; import org.codelibs.fess.crawler.container.StandardCrawlerContainer; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.dbflute.utflute.core.PlainTestCase; import org.slf4j.Logger;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/TextTransformerTest.java
*/ package org.codelibs.fess.crawler.transformer.impl; import org.codelibs.fess.crawler.Constants; import org.codelibs.fess.crawler.container.StandardCrawlerContainer; import org.codelibs.fess.crawler.entity.AccessResultDataImpl; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.CrawlerSystemException;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 4.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
import org.codelibs.fess.crawler.entity.Sitemap; import org.codelibs.fess.crawler.entity.SitemapSet; import org.codelibs.fess.crawler.exception.ChildUrlsException; import org.codelibs.fess.crawler.helper.SitemapsHelper; import org.codelibs.fess.crawler.processor.ResponseProcessor; import jakarta.annotation.Resource; /** * @author shinsuke * */ public class SitemapsResponseProcessor implements ResponseProcessor {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 2.4K bytes - Viewed (0) -
src/main/resources/crawler/transformer.xml
<!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" "http://dbflute.org/meta/lastadi10.dtd"> <components namespace="fessCrawler"> <include path="crawler/transformer_basic.xml"/> <component name="fessXpathTransformer" class="org.codelibs.fess.crawler.transformer.FessXpathTransformer" instance="singleton"> <property name="name">"fessXpathTransformer"</property> <property name="featureMap">defaultFeatureMap</property>
Registered: Thu Oct 31 13:40:30 UTC 2024 - Last Modified: Thu Jan 10 03:35:10 UTC 2019 - 1.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/es/config/exentity/FileConfig.java
import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.Constants; import org.codelibs.fess.app.service.FileAuthenticationService; import org.codelibs.fess.crawler.client.CrawlerClientFactory; import org.codelibs.fess.crawler.client.ftp.FtpAuthentication; import org.codelibs.fess.crawler.client.smb.SmbAuthentication; import org.codelibs.fess.es.config.bsentity.BsFileConfig; import org.codelibs.fess.helper.SystemHelper;
Registered: Thu Oct 31 13:40:30 UTC 2024 - Last Modified: Thu Feb 22 01:37:57 UTC 2024 - 9.8K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java
/** The key of the configuration. e.g. false */ String CRAWLER_DOCUMENT_APPEND_FILENAME = "crawler.document.append.filename"; /** The key of the configuration. e.g. 20 */ String CRAWLER_DOCUMENT_MAX_ALPHANUM_TERM_SIZE = "crawler.document.max.alphanum.term.size"; /** The key of the configuration. e.g. 10 */
Registered: Thu Oct 31 13:40:30 UTC 2024 - Last Modified: Fri Oct 11 21:11:58 UTC 2024 - 468.5K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.service.impl; import java.util.List; import java.util.regex.Pattern; import org.codelibs.fess.crawler.helper.MemoryDataHelper; import org.codelibs.fess.crawler.service.UrlFilterService; import jakarta.annotation.Resource; /** * @author shinsuke * */
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:47:32 UTC 2024 - 3.6K bytes - Viewed (0) -
src/main/resources/fess_config.properties
crawler.ignore.robots.tags=false crawler.ignore.content.exception=true crawler.failure.url.status.codes=404 crawler.system.monitor.interval=60 crawler.hotthread.ignore_idle_threads=true crawler.hotthread.interval=500ms crawler.hotthread.snapshots=10 crawler.hotthread.threads=3 crawler.hotthread.timeout=30s crawler.hotthread.type=cpu crawler.metadata.content.excludes=resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.*
Registered: Thu Oct 31 13:40:30 UTC 2024 - Last Modified: Tue Oct 01 14:13:38 UTC 2024 - 30.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClient.java
* either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.client; import java.util.Map; import org.codelibs.fess.crawler.entity.RequestData; import org.codelibs.fess.crawler.entity.ResponseData; /** * @author shinsuke * */ public interface CrawlerClient extends AutoCloseable {
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 1K bytes - Viewed (0)