Search Options

Results per page
Sort
Preferred Languages
Advance

Results 51 - 60 of 954 for crawled (0.12 sec)

  1. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.transformer;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.exception.FessSystemException;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:53:18 UTC 2024
    - 2.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    import org.codelibs.fess.crawler.entity.Sitemap;
    import org.codelibs.fess.crawler.entity.SitemapSet;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    import org.codelibs.fess.crawler.helper.SitemapsHelper;
    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    
    import jakarta.annotation.Resource;
    
    /**
     * @author shinsuke
     *
     */
    public class SitemapsResponseProcessor implements ResponseProcessor {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 2.4K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.service.impl;
    
    import java.util.List;
    import java.util.regex.Pattern;
    
    import org.codelibs.fess.crawler.helper.MemoryDataHelper;
    import org.codelibs.fess.crawler.service.UrlFilterService;
    
    import jakarta.annotation.Resource;
    
    /**
     * @author shinsuke
     *
     */
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 3.6K bytes
    - Viewed (0)
  4. src/main/resources/fess_config.properties

    crawler.ignore.robots.tags=false
    crawler.ignore.content.exception=true
    crawler.failure.url.status.codes=404
    crawler.system.monitor.interval=60
    crawler.hotthread.ignore_idle_threads=true
    crawler.hotthread.interval=500ms
    crawler.hotthread.snapshots=10
    crawler.hotthread.threads=3
    crawler.hotthread.timeout=30s
    crawler.hotthread.type=cpu
    crawler.metadata.content.excludes=resourceName,X-Parsed-By,Content-Encoding.*,Content-Type.*,X-TIKA.*,X-FESS.*
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Tue Oct 01 14:13:38 UTC 2024
    - 30.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/BinaryTransformer.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.io.BufferedInputStream;
    import java.io.ByteArrayInputStream;
    import java.io.IOException;
    
    import org.apache.commons.io.IOUtils;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 2.8K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.codelibs.core.io.FileUtil;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.jodconverter.core.office.OfficeException;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 8.2K bytes
    - Viewed (0)
  7. fess-crawler-lasta/src/main/resources/crawler/rule.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/transformer.xml" />
    
    	<component name="ruleManager"
    		class="org.codelibs.fess.crawler.rule.impl.RuleManagerImpl" instance="prototype">
    		<postConstruct name="addRule">
    			<arg>sitemapsRule</arg>
    		</postConstruct>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 1.5K bytes
    - Viewed (0)
  8. src/test/resources/plugin/repo3/index.html

    <a href="fess-crawler-es/" title="fess-crawler-es/">fess-crawler-es/</a>                                                 -         -      
    <a href="fess-crawler-lasta/" title="fess-crawler-lasta/">fess-crawler-lasta/</a>                                              -         -      
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Mon Jun 17 13:30:41 UTC 2024
    - 6.2K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.codelibs.fess.crawler.exception.MaxLengthExceededException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.helper.MimeTypeHelper;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 4.8K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/es/config/exentity/DataConfig.java

    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.client.ftp.FtpAuthentication;
    import org.codelibs.fess.crawler.client.ftp.FtpClient;
    import org.codelibs.fess.crawler.client.http.Authentication;
    import org.codelibs.fess.crawler.client.http.HcHttpClient;
    import org.codelibs.fess.crawler.client.http.form.FormScheme;
    import org.codelibs.fess.crawler.client.http.impl.AuthenticationImpl;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Oct 12 01:54:15 UTC 2024
    - 18.5K bytes
    - Viewed (0)
Back to top