Search Options

Results per page
Sort
Preferred Languages
Advance

Results 131 - 140 of 915 for crawled (0.04 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.BufferedInputStream;
    import java.io.ByteArrayInputStream;
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  2. fess-crawler-lasta/src/main/resources/crawler/client.xml

    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/robotstxt.xml" />
    	<include path="crawler/contentlength.xml" />
    	<include path="crawler/mimetype.xml" />
    
    	<component name="internalHttpClient" class="org.codelibs.fess.crawler.client.http.HcHttpClient"
    		instance="prototype">
    		<property name="connectionTimeout">15000</property>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Tue Aug 08 12:54:47 UTC 2023
    - 2.8K bytes
    - Viewed (0)
  3. pom.xml

    	<modelVersion>4.0.0</modelVersion>
    	<groupId>org.codelibs.fess</groupId>
    	<artifactId>fess-crawler-parent</artifactId>
    	<version>15.3.0-SNAPSHOT</version>
    	<packaging>pom</packaging>
    	<name>Fess Crawler Project</name>
    	<description>Fess Crawler is Crawler Framework.</description>
    	<url>https://github.com/codelibs/fess-crawler</url>
    	<inceptionYear>2009</inceptionYear>
    	<licenses>
    		<license>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/Extractor.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ExtractData;
    
    /**
     * The Extractor interface defines methods for extracting text data from an input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.6K bytes
    - Viewed (0)
  5. src/test/java/org/codelibs/fess/helper/IntervalControlHelperTest.java

            helper.setCrawlerWaitMillis(50);
    
            // Test when crawler is running
            assertTrue(helper.isCrawlerRunning());
            long start = System.currentTimeMillis();
            helper.checkCrawlerStatus();
            long end = System.currentTimeMillis();
            assertTrue(end - start < 100); // Should return quickly
    
            // Test when crawler is not running
            helper.setCrawlerRunning(false);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 10 13:41:04 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClient.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.client;
    
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    
    /**
     * Interface representing a client for a web crawler.
     * This client is responsible for executing requests and handling responses.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.client.CrawlerClient;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 17.2K bytes
    - Viewed (0)
  9. src/test/java/org/codelibs/fess/helper/CrawlingInfoHelperTest.java

                    return existingInfo;
                }
    
                @Override
                public void store(CrawlingInfo entity) {
                    // Should not be called for existing info
                    fail("Store should not be called for existing info");
                }
    
                @Override
                public void storeInfo(List<CrawlingInfoParam> crawlingInfoParamList) {
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jul 12 05:35:01 UTC 2025
    - 26.6K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformerTest.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.util.ArrayList;
    import java.util.List;
    import java.util.Map;
    
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultDataImpl;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.5K bytes
    - Viewed (0)
Back to top