Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 81 - 90 of 470 for Crawler (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

    import org.codelibs.core.timer.TimeoutTask;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.client.AccessTimeoutTarget;
    import org.codelibs.fess.crawler.client.http.Authentication;
    import org.codelibs.fess.crawler.client.http.RequestHeader;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    import com.google.common.base.Charsets;
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 12.2K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/FileTransformerTest.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.io.File;
    import java.io.IOException;
    import java.util.Map;
    
    import org.codelibs.core.io.FileUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultDataImpl;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 7.6K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.entity.ExtractData;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 4.6K bytes
    - Viewed (1)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

     *   <li>org.codelibs.fess.crawler.Constants</li>
     *   <li>org.codelibs.fess.crawler.exception.CrawlerSystemException</li>
     *   <li>org.codelibs.fess.crawler.entity.AccessResultData</li>
     *   <li>org.codelibs.core.lang.StringUtil</li>
     * </ul>
     *
     * @see org.codelibs.fess.crawler.Constants
     * @see org.codelibs.fess.crawler.exception.CrawlerSystemException
     * @see org.codelibs.fess.crawler.entity.AccessResultData
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 22 13:28:22 UTC 2025
    - 9.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/container/CrawlerContainer.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.container;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * The CrawlerContainer interface provides methods for managing components
     * within a crawler container. It includes methods to retrieve components,
     * check availability, and destroy the container. Additionally, it provides
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

         * Datetime format.
         *
         * By providing the last modification timestamp, you enable search engine
         * crawlers to retrieve only a subset of the Sitemaps in the index i.e. a
         * crawler may only retrieve Sitemaps that were modified since a certain
         * date. This incremental Sitemap fetching mechanism allows for the rapid
         * discovery of new URLs on very large sites.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.4K bytes
    - Viewed (1)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/CrawlerLoginFailureException.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * The crawler login failure exception.
     * This exception is thrown when the crawler fails to login to a website.
     *
     */
    public class CrawlerLoginFailureException extends CrawlerSystemException {
        private static final long serialVersionUID = 1L;
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractorTest.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.helper.impl.MimeTypeHelperImpl;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
     * @author shinsuke
     *
     */
    public class PdfExtractorTest extends PlainTestCase {
        private static final Logger logger = LogManager.getLogger(PdfExtractorTest.class);
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 7.6K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.service.impl;
    
    import java.util.List;
    import java.util.regex.Pattern;
    
    import org.codelibs.fess.crawler.helper.MemoryDataHelper;
    import org.codelibs.fess.crawler.service.UrlFilterService;
    
    import jakarta.annotation.Resource;
    
    /**
     * Implementation of the {@link UrlFilterService} interface.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  10. fess-crawler-lasta/src/main/resources/crawler/rule.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/transformer.xml" />
    
    	<component name="ruleManager"
    		class="org.codelibs.fess.crawler.rule.impl.RuleManagerImpl" instance="prototype">
    		<postConstruct name="addRule">
    			<arg>sitemapsRule</arg>
    		</postConstruct>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 1.5K bytes
    - Viewed (0)
Back to top