Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 61 - 70 of 189 for crawler_ (0.29 sec)

  1. src/main/resources/crawler/extractor+tikaExtractor.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<component name="tikaExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor">
    		<property name="maxCompressionRatio">2</property>
    		<property name="maxUncompressionSize">10000000</property>
    	</component>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Aug 25 12:46:12 UTC 2019
    - 461 bytes
    - Viewed (0)
  2. src/main/resources/crawler/contentlength.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    
    	<component name="contentLengthHelper"
    		class="org.codelibs.fess.crawler.helper.ContentLengthHelper" instance="singleton">
    		<property name="defaultMaxLength">10485760</property><!-- 10M -->
    		<postConstruct name="addMaxLength">
    			<arg>"text/html"</arg>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sun Oct 11 06:51:14 UTC 2015
    - 561 bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/opensearch/client/CrawlerEngineClient.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.client.FesenClient;
    import org.codelibs.fess.mylasta.direction.FessConfig;
    import org.codelibs.fess.util.ComponentUtil;
    import org.opensearch.common.settings.Settings;
    import org.opensearch.common.settings.Settings.Builder;
    import org.opensearch.transport.client.Client;
    
    /**
     * OpenSearch client implementation specifically for crawler operations.
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/web/admin/webconfig/AdminWebconfigAction.java

         */
        @Execute
        @Secured({ ROLE, ROLE + VIEW })
        public HtmlResponse index(final SearchForm form) {
            return asListHtml();
        }
    
        /**
         * Displays a paginated list of web crawler configurations.
         *
         * @param pageNumber the page number to display (optional)
         * @param form the search form containing filter criteria
         * @return HTML response with the web config list
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 21K bytes
    - Viewed (0)
  5. src/main/webapp/WEB-INF/view/admin/scheduler/admin_scheduler_edit.jsp

                                            <la:errors property="crawler"/>
                                            <div class="form-check">
                                                <la:checkbox styleId="crawler" styleClass="form-check-input" property="crawler"/>
                                                <label for="crawler" class="form-check-label">
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Mon Jan 16 12:54:35 UTC 2023
    - 9.6K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.transformer;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.exception.FessSystemException;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/helper/ProtocolHelper.java

    /**
     * Helper class for managing and validating URL protocols in Fess crawling system.
     * This class handles the initialization and validation of web and file protocols
     * used by the crawler to determine which URLs can be crawled.
     */
    public class ProtocolHelper {
        private static final Logger logger = LogManager.getLogger(ProtocolHelper.class);
    
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 9.7K bytes
    - Viewed (0)
  8. src/main/resources/fess_label_de.properties

    labels.crawling_info_delete_all_cancel=Abbrechen
    labels.crawling_info_thread_dump=Thread-Dump
    labels.crawling_info_CrawlerStartTime=Crawler-Startzeit
    labels.crawling_info_CrawlerEndTime=Crawler-Endzeit
    labels.crawling_info_CrawlerExecTime=Crawler-Ausführungszeit
    labels.crawling_info_CrawlerStatus=Crawler-Status
    labels.crawling_info_WebFsCrawlExecTime=Crawl-Ausführungszeit (Web/Datei)
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 10 04:56:21 UTC 2025
    - 43.5K bytes
    - Viewed (1)
  9. src/test/java/org/codelibs/fess/it/CrawlTestBase.java

                ThreadUtil.sleep(500);
                count++;
                final Map<String, Object> scheduler = getSchedulerItem(namePrefix);
                assertTrue(scheduler.containsKey("running"));
                isRunning = (Boolean) scheduler.get("running");
            }
            if (300 <= count) {
                logger.info("Time out: Failed to start crawler)");
                fail(); // Time Out
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 10K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/thumbnail/impl/BaseThumbnailGenerator.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.core.misc.Tuple3;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.client.CrawlerClient;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.exception.ThumbnailGenerationException;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 13.3K bytes
    - Viewed (0)
Back to top