Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 22 for crawl (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import org.codelibs.fess.crawler.exception.RobotsTxtException;
    
    /**
     * Robots.txt Specifications:
     * <ul>
     * <li><a href=
     * "https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt"
     * >https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt
     * </a></li>
     * </ul>
     *
     * @author bowez
     * @author shinsuke
     *
     */
    public class RobotsTxtHelper {
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:40:57 UTC 2024
    - 6.1K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/exec/Crawler.java

                    webFsCrawlerThread = new Thread((Runnable) () -> {
                        // crawl web
                        writeTimeToSessionInfo(crawlingInfoHelper, Constants.WEB_FS_CRAWLER_START_TIME);
                        webFsIndexHelper.crawl(options.sessionId, webConfigIdList, fileConfigIdList);
                        writeTimeToSessionInfo(crawlingInfoHelper, Constants.WEB_FS_CRAWLER_END_TIME);
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:20:39 UTC 2024
    - 24K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * command. Even though search engine crawlers may consider this information
         * when making decisions, they may crawl pages marked "hourly" less
         * frequently than that, and they may crawl pages marked "yearly" more
         * frequently than that. Crawlers may periodically crawl pages marked
         * "never" so that they can handle unexpected changes to those pages.
         */
        private String changefreq;
    
        /**
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 4.9K bytes
    - Viewed (0)
  4. build-logic-commons/code-quality-rules/src/main/resources/checkstyle/checkstyle-api.xml

      ~ See the License for the specific language governing permissions and
      ~ limitations under the License.
      -->
    <!DOCTYPE module PUBLIC
            "-//Puppy Crawl//DTD Check Configuration 1.2//EN"
            "http://www.puppycrawl.com/dtds/configuration_1_2.dtd">
    <module name="Checker">
        <module name="SuppressionFilter">
            <property name="file" value="${config_loc}/suppressions.xml"/>
    Registered: Wed Nov 06 11:36:14 UTC 2024
    - Last Modified: Thu Nov 17 23:20:14 UTC 2022
    - 1.6K bytes
    - Viewed (0)
  5. src/main/resources/fess_label_de.properties

    labels.crawling_info_CrawlerExecTime=Crawler Ausführungsdauer
    labels.crawling_info_CrawlerStatus=Crawler-Status
    labels.crawling_info_WebFsCrawlExecTime=Crawl Ausführungsdauer (Web/Dateisystem)
    labels.crawling_info_WebFsCrawlStartTime=Crawl Startzeit (Web/Dateisystem)
    labels.crawling_info_WebFsCrawlEndTime=Crawl Endzeit (Web/Dateisystem)
    labels.crawling_info_WebFsIndexExecTime=Indizierung Ausführungsdauer (Web/Dateisystem)
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Mar 22 11:58:34 UTC 2024
    - 42.8K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/helper/DataIndexHelper.java

        protected int crawlerPriority = Thread.NORM_PRIORITY;
    
        protected final List<DataCrawlingThread> dataCrawlingThreadList = Collections.synchronizedList(new ArrayList<>());
    
        public void crawl(final String sessionId) {
            final List<DataConfig> configList = ComponentUtil.getCrawlingConfigHelper().getAllDataConfigList();
    
            if (configList.isEmpty()) {
                // nothing
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 12K bytes
    - Viewed (0)
  7. src/main/resources/fess_label_en.properties

    labels.crawling_info_WebFsCrawlExecTime=Crawl exec time (Web/File system)
    labels.crawling_info_WebFsCrawlStartTime=Crawl start time (Web/File system)
    labels.crawling_info_WebFsCrawlEndTime=Crawl end time (Web/File system)
    labels.crawling_info_WebFsIndexExecTime=Indexing exec time (Web/File system)
    labels.crawling_info_WebFsIndexSize=Index size (Web/File system)
    labels.crawling_info_DataCrawlExecTime=Crawl exec time (Data store)
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Mar 22 11:58:34 UTC 2024
    - 40.7K bytes
    - Viewed (0)
  8. src/main/resources/fess_message_ru.properties

    errors.login_error=Username or Password is not correct.
    errors.sso_login_error=Failed to process SSO login.
    errors.could_not_find_log_file=Could not find {0}.
    errors.failed_to_start_crawl_process=Failed to start a crawl process.
    errors.invalid_design_jsp_file_name=Invalid JSP file.
    errors.design_jsp_file_does_not_exist=JSP file does not exist.
    errors.design_file_name_is_not_found=The file name is not specified.
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri May 20 12:12:28 UTC 2022
    - 10.2K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

        protected int crawlerPriority = Thread.NORM_PRIORITY;
    
        protected final List<Crawler> crawlerList = Collections.synchronizedList(new ArrayList<>());
    
        public void crawl(final String sessionId, final List<String> webConfigIdList, final List<String> fileConfigIdList) {
            final boolean runAll = webConfigIdList == null && fileConfigIdList == null;
            final List<WebConfig> webConfigList;
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:11:58 UTC 2024
    - 22.6K bytes
    - Viewed (0)
  10. src/main/resources/fess_label.properties

    labels.crawling_info_WebFsCrawlExecTime=Crawl exec time (Web/File system)
    labels.crawling_info_WebFsCrawlStartTime=Crawl start time (Web/File system)
    labels.crawling_info_WebFsCrawlEndTime=Crawl end time (Web/File system)
    labels.crawling_info_WebFsIndexExecTime=Indexing exec time (Web/File system)
    labels.crawling_info_WebFsIndexSize=Index size (Web/File system)
    labels.crawling_info_DataCrawlExecTime=Crawl exec time (Data store)
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Mar 22 11:58:34 UTC 2024
    - 40.7K bytes
    - Viewed (0)
Back to top