Search Options

Results per page
Sort
Preferred Languages
Advance

Results 151 - 160 of 538 for crawlers (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * @author shinsuke
     *
     */
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/FileTransformer.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.io.File;
    import java.io.FileOutputStream;
    import java.io.IOException;
    import java.io.InputStream;
    import java.io.OutputStream;
    import java.io.UnsupportedEncodingException;
    
    import org.codelibs.core.io.CopyUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 7.8K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/ResponseDataUtil.java

     */
    package org.codelibs.fess.crawler.util;
    
    import java.io.File;
    import java.io.FileOutputStream;
    import java.io.InputStream;
    
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.CopyUtil;
    import org.codelibs.core.io.FileUtil;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    
    /**
     * @author shinsuke
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.8K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

    import org.codelibs.fess.crawler.entity.OpenSearchUrlQueue;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.OpenSearchAccessException;
    import org.codelibs.fess.crawler.service.UrlQueueService;
    import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
    import org.opensearch.action.DocWriteRequest.OpType;
    import org.opensearch.action.bulk.BulkRequestBuilder;
    import org.opensearch.action.bulk.BulkResponse;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 13.4K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/es/config/bsentity/dbmeta/ScheduledJobDbm.java

                false, "Boolean", 0, 0, null, null, false, null, null, null, null, null, false);
        protected final ColumnInfo _columnCrawler = cci("crawler", "crawler", null, null, Boolean.class, "crawler", null, false, false, false,
                "Boolean", 0, 0, null, null, false, null, null, null, null, null, false);
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 13.3K bytes
    - Viewed (0)
  6. cmd/streaming-v4-unsigned.go

    	if trailer {
    		// Discard anything unsigned.
    		req.Trailer = make(http.Header)
    		trailers := req.Header.Values(awsTrailerHeader)
    		for _, key := range trailers {
    			req.Trailer.Add(key, "")
    		}
    	} else {
    		req.Trailer = nil
    	}
    	return &s3UnsignedChunkedReader{
    		trailers: req.Trailer,
    		reader:   bufio.NewReader(req.Body),
    		buffer:   make([]byte, 64*1024),
    	}, ErrNone
    }
    
    Registered: Sun Nov 03 19:28:11 UTC 2024
    - Last Modified: Sat May 06 02:53:12 UTC 2023
    - 6.1K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/interval/impl/HostIntervalControllerTest.java

     */
    package org.codelibs.fess.crawler.interval.impl;
    
    import java.util.ArrayList;
    import java.util.List;
    import java.util.concurrent.Callable;
    import java.util.concurrent.ExecutionException;
    import java.util.concurrent.ExecutorService;
    import java.util.concurrent.Executors;
    import java.util.concurrent.Future;
    
    import org.codelibs.fess.crawler.entity.UrlQueue;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 3.2K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import java.util.regex.Pattern;
    
    import org.apache.commons.io.input.BOMInputStream;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.RobotsTxt;
    import org.codelibs.fess.crawler.entity.RobotsTxt.Directive;
    import org.codelibs.fess.crawler.exception.RobotsTxtException;
    
    /**
     * Robots.txt Specifications:
     * <ul>
     * <li><a href=
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:40:57 UTC 2024
    - 6.1K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    import java.util.Set;
    
    import org.codelibs.fess.crawler.entity.RequestData;
    
    /**
     * ChildUrlsException is thrown when having child urls.
     *
     * @author shinsuke
     *
     */
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 1.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

     */
    package org.codelibs.fess.crawler.util;
    
    import java.io.ByteArrayInputStream;
    import java.util.ArrayList;
    import java.util.HashMap;
    import java.util.List;
    import java.util.Map;
    
    import javax.xml.XMLConstants;
    import javax.xml.parsers.SAXParser;
    import javax.xml.parsers.SAXParserFactory;
    
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 6.1K bytes
    - Viewed (0)
Back to top