Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 16 for doctype (0.04 sec)

  1. fess-crawler-opensearch/src/test/resources/app.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components>
        <include path="crawler_opensearch.xml"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 216 bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/resources/crawler/opensearch.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<component name="esClient"
    		class="org.codelibs.fess.crawler.client.FesenClient">
    	</component>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 293 bytes
    - Viewed (1)
  3. fess-crawler-lasta/src/main/resources/crawler/client.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/robotstxt.xml" />
    	<include path="crawler/contentlength.xml" />
    	<include path="crawler/mimetype.xml" />
    
    	<component name="internalHttpClient" class="org.codelibs.fess.crawler.client.http.HcHttpClient"
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Tue Aug 08 12:54:47 UTC 2023
    - 2.8K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
        <include path="crawler/container.xml"/>
        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  5. README.md

    ### XML Configuration
    
    Fess Crawler uses XML-based configuration with LastaFlute DI. Place configuration files in your classpath:
    
    ```xml
    <!-- crawler.xml -->
    <?xml version="1.0" encoding="UTF-8"?>
    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
        "http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
        <component name="crawler" class="org.codelibs.fess.crawler.Crawler" instance="prototype"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.log;
    
    /**
     * LogType defines the different types of log messages that can be generated during the crawling process.
     * Each enum constant represents a specific event or state in the crawler's execution.
     */
    public enum LogType {
        /** Indicates the start of a crawling process. */
        START_CRAWLING,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  7. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        <!--  files which contain HTML within them, eg mime emails -->
        <magic priority="40">
          <match value="&lt;!DOCTYPE HTML" type="string" offset="0:64"/>
          <match value="&lt;!DOCTYPE html" type="string" offset="0:64"/>
          <match value="&lt;!doctype HTML" type="string" offset="0:64"/>
          <match value="&lt;!doctype html" type="string" offset="0:64"/>
          <match value="&lt;HEAD" type="string" offset="0:64"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

        }
    
        /**
         * Logs a message using the provided LogHelper.
         * @param logHelper The LogHelper instance.
         * @param key The LogType key.
         * @param objs The objects to log.
         */
        protected void log(final LogHelper logHelper, final LogType key, final Object... objs) {
            if (logHelper != null) {
                logHelper.log(key, objs);
            }
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/LogHelper.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.helper;
    
    import org.codelibs.fess.crawler.log.LogType;
    
    /**
     * Interface for logging helper.
     * Provides a method to log messages with a specified log type and additional objects.
     */
    public interface LogHelper {
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.service.UrlFilterService;
    import org.codelibs.fess.crawler.util.OpenSearchCrawlerConfig;
    import org.opensearch.action.DocWriteRequest.OpType;
    import org.opensearch.index.query.QueryBuilders;
    
    import com.google.common.cache.CacheBuilder;
    import com.google.common.cache.CacheLoader;
    import com.google.common.cache.LoadingCache;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 9.2K bytes
    - Viewed (0)
Back to top