Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 651 for crawler (0.32 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.Map;
    
    import org.apache.poi.hssf.usermodel.HSSFWorkbook;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .xls file.
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.8K bytes
    - Viewed (0)
  2. README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute"): Web Framework
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job"): Job Scheduler
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler"): Web Crawler
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.3K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java

     */
    package org.codelibs.fess.crawler.processor;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.processor.impl.DefaultResponseProcessor;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:53:18 UTC 2024
    - 2.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/impl/AuthenticationImpl.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.client.http.impl;
    
    import org.apache.http.auth.AuthScheme;
    import org.apache.http.auth.AuthScope;
    import org.apache.http.auth.Credentials;
    import org.codelibs.fess.crawler.client.http.Authentication;
    
    /**
     * @author shinsuke
     *
     */
    public class AuthenticationImpl implements Authentication {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 2.3K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

    <components namespace="fessCrawler">
        <include path="crawler/container.xml"/>
        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.core.lang.SystemUtil;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.util.CrawlingParameterUtil;
    
    public class HostIntervalController extends DefaultIntervalController {
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 3K bytes
    - Viewed (0)
  7. src/test/resources/plugin/repo1/index.html

    <a href="fess-crawler-es/" title="fess-crawler-es/">fess-crawler-es/</a>                                                 -         -      
    <a href="fess-crawler-lasta/" title="fess-crawler-lasta/">fess-crawler-lasta/</a>                                              -         -      
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Tue Aug 13 07:34:14 UTC 2019
    - 3.3K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/es/config/bsentity/BsScheduledJob.java

            this.available = value;
        }
    
        public Boolean getCrawler() {
            checkSpecifiedProperty("crawler");
            return crawler;
        }
    
        public void setCrawler(Boolean value) {
            registerModifiedProperty("crawler");
            this.crawler = value;
        }
    
        public String getCreatedBy() {
            checkSpecifiedProperty("createdBy");
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 9.3K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/FaultTolerantClientTest.java

     */
    package org.codelibs.fess.crawler.client;
    
    import java.util.List;
    import java.util.Map;
    
    import org.codelibs.core.lang.SystemUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.client.FaultTolerantClient.RequestListener;
    import org.codelibs.fess.crawler.entity.RequestData;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 15.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

    import org.codelibs.core.timer.TimeoutTask;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.client.AccessTimeoutTarget;
    import org.codelibs.fess.crawler.client.http.Authentication;
    import org.codelibs.fess.crawler.client.http.RequestHeader;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    import org.slf4j.Logger;
    import org.slf4j.LoggerFactory;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 10K bytes
    - Viewed (0)
Back to top