Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 122 for crawled (0.12 sec)

  1. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler1.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler1.getCrawlerContext().setNumOfThread(numOfThread);
    
                Thread.sleep(100);
    
                final Crawler crawler2 = getComponent(Crawler.class);
                crawler2.setBackground(true);
                ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*");
                crawler2.addUrl(url2);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 7.7K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

    <components namespace="fessCrawler">
        <include path="crawler/container.xml"/>
        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  3. pom.xml

    	<groupId>org.codelibs.fess</groupId>
    	<artifactId>fess-crawler-parent</artifactId>
    	<version>15.0.0-SNAPSHOT</version>
    	<packaging>pom</packaging>
    	<name>Fess Crawler Project</name>
    	<description>Fess Crawler is Crawler Framework.</description>
    	<url>https://github.com/codelibs/fess-crawler</url>
    	<issueManagement>
    		<system>GitHub</system>
    		<url>https://github.com/codelibs/fess-crawler/issues</url>
    	</issueManagement>
    	<scm>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueueImpl.java

        protected float weight = 1.0f;
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.entity.UrlQueue#getId()
         */
        @Override
        public IDTYPE getId() {
            return id;
        }
    
        /*
         * (non-Javadoc)
         *
         * @see org.codelibs.fess.crawler.entity.UrlQueue#setId(IDTYPE)
         */
        @Override
        public void setId(final IDTYPE id) {
            this.id = id;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Mon Nov 04 07:44:18 UTC 2024
    - 5.2K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/pom.xml

    	<modelVersion>4.0.0</modelVersion>
    	<artifactId>fess-crawler-opensearch</artifactId>
    	<packaging>jar</packaging>
    	<name>Fess Crawler Elasticsearch</name>
    	<parent>
    		<groupId>org.codelibs.fess</groupId>
    		<artifactId>fess-crawler-parent</artifactId>
    		<version>15.0.0-SNAPSHOT</version>
    		<relativePath>../pom.xml</relativePath>
    	</parent>
    	<build>
    		<plugins>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 3.4K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/helper/PluginHelper.java

            if (artifactType != ArtifactType.CRAWLER) {
                return false;
            }
    
            if ("fess-crawler".equals(name)//
                    || "fess-crawler-db".equals(name)//
                    || "fess-crawler-db-h2".equals(name)//
                    || "fess-crawler-db-mysql".equals(name)//
                    || "fess-crawler-es".equals(name)//
                    || "fess-crawler-lasta".equals(name)//
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Oct 24 01:47:10 UTC 2024
    - 17.8K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

    import org.codelibs.core.misc.Pair;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Oct 24 12:16:00 UTC 2024
    - 19.4K bytes
    - Viewed (0)
  8. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/util/OpenSearchCrawlerConfig.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.util;
    
    public class OpenSearchCrawlerConfig {
        protected String queueIndex = ".crawler.queue";
    
        protected String dataIndex = ".crawler.data";
    
        protected String filterIndex = ".crawler.filter";
    
        protected int queueShards = Runtime.getRuntime().availableProcessors() * 2;
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.7K bytes
    - Viewed (0)
  9. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

    import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.OpenSearchAccessException;
    import org.codelibs.fess.crawler.service.UrlQueueService;
    import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
    import org.opensearch.action.DocWriteRequest.OpType;
    import org.opensearch.action.bulk.BulkRequestBuilder;
    import org.opensearch.action.bulk.BulkResponse;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 13.4K bytes
    - Viewed (0)
  10. deps.xml

    <project name="deps" basedir=".">
    	<property name="target.dir" value="${basedir}/target/deps" />
    	<property name="webinf.dir" value="${basedir}/src/main/webapp/WEB-INF" />
    	<property name="crawler.dir" value="${basedir}/src/main/webapp/WEB-INF/env/crawler" />
    	<property name="suggest.dir" value="${basedir}/src/main/webapp/WEB-INF/env/suggest" />
    	<property name="thumbnail.dir" value="${basedir}/src/main/webapp/WEB-INF/env/thumbnail" />
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Oct 24 04:37:19 UTC 2024
    - 2.5K bytes
    - Viewed (0)
Back to top