Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 68 for crawler (0.05 sec)

  1. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler1.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler1.getCrawlerContext().setNumOfThread(numOfThread);
    
                Thread.sleep(100);
    
                final Crawler crawler2 = getComponent(Crawler.class);
                crawler2.setBackground(true);
                ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*");
                crawler2.addUrl(url2);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 7.7K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

    <components namespace="fessCrawler">
        <include path="crawler/container.xml"/>
        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueueImpl.java

        protected float weight = 1.0f;
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.entity.UrlQueue#getId()
         */
        @Override
        public IDTYPE getId() {
            return id;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.entity.UrlQueue#setId(IDTYPE)
         */
        @Override
        public void setId(final IDTYPE id) {
            this.id = id;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Mon Nov 04 07:44:18 UTC 2024
    - 5.2K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/es/config/exentity/CrawlingConfig.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.client.ftp.FtpClient;
    import org.codelibs.fess.crawler.client.http.HcHttpClient;
    import org.codelibs.fess.crawler.client.smb.SmbClient;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    import org.codelibs.fess.util.ComponentUtil;
    
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Oct 24 13:01:38 UTC 2024
    - 5.5K bytes
    - Viewed (0)
  5. deps.xml

    <project name="deps" basedir=".">
    	<property name="target.dir" value="${basedir}/target/deps" />
    	<property name="webinf.dir" value="${basedir}/src/main/webapp/WEB-INF" />
    	<property name="crawler.dir" value="${basedir}/src/main/webapp/WEB-INF/env/crawler" />
    	<property name="suggest.dir" value="${basedir}/src/main/webapp/WEB-INF/env/suggest" />
    	<property name="thumbnail.dir" value="${basedir}/src/main/webapp/WEB-INF/env/thumbnail" />
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Oct 24 04:37:19 UTC 2024
    - 2.5K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java

     */
    package org.codelibs.fess.crawler.service.impl;
    
    import java.util.List;
    import java.util.Map;
    import java.util.function.Consumer;
    
    import org.apache.lucene.search.TotalHits;
    import org.codelibs.core.beans.util.BeanUtil;
    import org.codelibs.fess.crawler.entity.OpenSearchAccessResult;
    import org.codelibs.fess.crawler.entity.OpenSearchAccessResultData;
    import org.codelibs.fess.crawler.exception.OpenSearchAccessException;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 8.5K bytes
    - Viewed (0)
  7. pom.xml

    	<groupId>org.codelibs.fess</groupId>
    	<artifactId>fess-crawler-parent</artifactId>
    	<version>15.0.0-SNAPSHOT</version>
    	<packaging>pom</packaging>
    	<name>Fess Crawler Project</name>
    	<description>Fess Crawler is Crawler Framework.</description>
    	<url>https://github.com/codelibs/fess-crawler</url>
    	<issueManagement>
    		<system>GitHub</system>
    		<url>https://github.com/codelibs/fess-crawler/issues</url>
    	</issueManagement>
    	<scm>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  8. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

     */
    package org.codelibs.fess.crawler.service.impl;
    
    import java.util.ArrayList;
    import java.util.HashSet;
    import java.util.List;
    import java.util.Set;
    import java.util.concurrent.ExecutionException;
    import java.util.concurrent.TimeUnit;
    import java.util.regex.Pattern;
    import java.util.stream.Collectors;
    
    import org.codelibs.fess.crawler.entity.OpenSearchUrlFilter;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 6.3K bytes
    - Viewed (0)
  9. fess-crawler-opensearch/src/test/resources/lasta_di.properties

    #smart.deploy.mode.location = maihama_env.properties: lasta_di.smart.deploy.mode
    
    # package for smart deploy target e.g. org.docksidestage.app
    smart.package1 = org.codelibs.fess.crawler
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 479 bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

    import org.codelibs.core.misc.Pair;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Oct 24 12:16:00 UTC 2024
    - 19.4K bytes
    - Viewed (0)
Back to top