Search Options

Results per page
Sort
Preferred Languages
Advance

Results 21 - 30 of 34 for fess_crawler (0.26 sec)

  1. fess-crawler-lasta/src/main/resources/crawler/mimetype.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="mimeTypeHelper"
    		class="org.codelibs.fess.crawler.helper.impl.MimeTypeHelperImpl" instance="singleton">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 374 bytes
    - Viewed (0)
  2. fess-crawler-lasta/src/main/resources/crawler/sitemaps.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="sitemapsHelper" class="org.codelibs.fess.crawler.helper.SitemapsHelper"
    		instance="singleton">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 365 bytes
    - Viewed (0)
  3. fess-crawler-lasta/src/main/resources/crawler/urlconverter.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<!-- Converts child links to normalize it. -->
    	<component name="urlConvertHelper" class="org.codelibs.fess.crawler.helper.UrlConvertHelper">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 394 bytes
    - Viewed (0)
  4. src/main/resources/crawler/extractor+tikaExtractor.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<component name="tikaExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor">
    		<property name="maxCompressionRatio">2</property>
    		<property name="maxUncompressionSize">10000000</property>
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Aug 25 12:46:12 UTC 2019
    - 461 bytes
    - Viewed (0)
  5. src/main/resources/crawler/rule.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/transformer.xml" />
    
    	<component name="ruleManager" class="org.codelibs.fess.crawler.rule.impl.RuleManagerImpl" instance="prototype">
    		<postConstruct name="addRule">
    			<arg>sitemapsRule</arg>
    		</postConstruct>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jun 04 08:42:49 UTC 2020
    - 4.6K bytes
    - Viewed (0)
  6. src/main/resources/crawler/contentlength.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="contentLengthHelper"
    		class="org.codelibs.fess.crawler.helper.ContentLengthHelper" instance="singleton">
    		<property name="defaultMaxLength">10485760</property><!-- 10M -->
    		<postConstruct name="addMaxLength">
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Oct 11 06:51:14 UTC 2015
    - 561 bytes
    - Viewed (0)
  7. fess-crawler-lasta/src/main/resources/crawler/robotstxt.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="robotsTxtHelper" class="org.codelibs.fess.crawler.helper.RobotsTxtHelper"
    		instance="prototype">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 367 bytes
    - Viewed (0)
  8. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt

    User-agent: FessCrawler
    Disallow:           # allows all 
    
    User-agent: BruteBot
    Disallow: /
    Allow: /foo/bar/
    Crawl-delay: 1314000
    
    # welcome!
    User-agent: Googlebot
    Crawl-delay: 1
    
    User-agent: *
    Disallow: /private/
    Disallow: /help        # disallows /help.html, /help/index.html, etc.
    Allow: /help/faq.html
    Crawl-delay: 3
    
    User-agent: Crawler
    Disallow: /aaa
    
    User-agent: Crawler/1.0
    Disallow: /bbb
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 566 bytes
    - Viewed (0)
  9. fess-crawler-lasta/src/main/resources/crawler/client.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/robotstxt.xml" />
    	<include path="crawler/contentlength.xml" />
    	<include path="crawler/mimetype.xml" />
    
    	<component name="internalHttpClient" class="org.codelibs.fess.crawler.client.http.HcHttpClient"
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Tue Aug 08 12:54:47 UTC 2023
    - 2.8K bytes
    - Viewed (0)
  10. src/main/resources/crawler/transformer.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/transformer_basic.xml"/>
    
    	<component name="fessXpathTransformer" class="org.codelibs.fess.crawler.transformer.FessXpathTransformer" instance="singleton">
    		<property name="name">"fessXpathTransformer"</property>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Fri Dec 20 13:14:54 UTC 2024
    - 1.7K bytes
    - Viewed (0)
Back to top