Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 111 - 120 of 658 for crawler (0.23 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.interval;
    
    /**
     * The {@code IntervalController} interface defines methods for controlling
     * the delay intervals in a web crawler. It includes constants representing
     * different types of processing states and a method to introduce a delay
     * based on the type of processing.
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

     */
    package org.codelibs.fess.crawler.service.impl;
    
    import java.util.ArrayList;
    import java.util.HashSet;
    import java.util.List;
    import java.util.Set;
    import java.util.concurrent.ExecutionException;
    import java.util.concurrent.TimeUnit;
    import java.util.regex.Pattern;
    import java.util.stream.Collectors;
    
    import org.codelibs.fess.crawler.entity.OpenSearchUrlFilter;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

     */
    package org.codelibs.fess.crawler.helper.impl;
    
    import java.util.Set;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/SitemapsException.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * Exception thrown during sitemaps processing in the crawler.
     * This exception extends {@link org.codelibs.fess.crawler.exception.CrawlerSystemException}
     * and provides constructors for wrapping other exceptions or creating a new exception with a message.
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb1/SmbClientTest.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.client.smb1;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
     * @author shinsuke
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 2.3K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImplTest.java

     */
    package org.codelibs.fess.crawler.rule.impl;
    
    import java.io.File;
    
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.helper.SitemapsHelper;
    import org.codelibs.fess.crawler.rule.Rule;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  7. src/main/resources/crawler/interval.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="intervalController"
    		class="org.codelibs.fess.crawler.interval.FessIntervalController"
    		instance="prototype">
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Oct 11 06:51:14 UTC 2015
    - 381 bytes
    - Viewed (0)
  8. fess-crawler-lasta/src/main/resources/crawler/filter.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="urlFilter"
    		class="org.codelibs.fess.crawler.filter.impl.UrlFilterImpl" instance="prototype">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 364 bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.rule.impl;
    
    import java.util.HashMap;
    import java.util.Map;
    import java.util.regex.Matcher;
    import java.util.regex.Pattern;
    
    import org.codelibs.core.beans.util.BeanUtil;
    import org.codelibs.core.beans.util.CopyOptions;
    import org.codelibs.fess.crawler.entity.ResponseData;
    
    /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 25.6K bytes
    - Viewed (0)
Back to top