Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 91 - 100 of 529 for crawlen (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapNews.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.Serializable;
    
    /**
     * Represents a news entry within a sitemap URL.
     * This class encapsulates the properties of a news article as defined in the Google News Sitemap extension.
     *
     * <p>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 13:34:36 UTC 2025
    - 4.8K bytes
    - Viewed (0)
  2. src/main/resources/fess_message.properties

    success.crawling_info_delete_all = Deleted session data.
    success.start_crawl_process = Started a crawl process.
    success.upload_design_file = Updated {0}.
    success.update_design_jsp_file = Updated {0}.
    success.create_crawling_config_at_wizard = Created a crawling config {0}.
    success.failure_url_delete_all = Deleted failure URLs.
    success.delete_file = Deleted {0} file.
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Jul 05 02:36:47 UTC 2025
    - 11.6K bytes
    - Viewed (0)
  3. src/main/resources/fess_message_en.properties

    success.crawling_info_delete_all = Deleted session data.
    success.start_crawl_process = Started a crawl process.
    success.upload_design_file = Updated {0}.
    success.update_design_jsp_file = Updated {0}.
    success.create_crawling_config_at_wizard = Created a crawling config {0}.
    success.failure_url_delete_all = Deleted failure URLs.
    success.delete_file = Deleted {0} file.
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Jul 05 02:36:47 UTC 2025
    - 11.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

    import org.codelibs.core.misc.Pair;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 29 07:42:33 UTC 2025
    - 30.5K bytes
    - Viewed (0)
  5. docs/fr/README.md

    * [LastaFlute](https://github.com/lastaflute/lastaflute "LastaFlute") : Framework Web
    * [Lasta Job](https://github.com/lastaflute/lasta-job "Lasta Job") : Planificateur de tâches
    * [Fess Crawler](https://github.com/codelibs/fess-crawler "Fess Crawler") : Crawler Web
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Tue Nov 11 22:42:32 UTC 2025
    - 7.9K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/CrawlerSystemException.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * The class CrawlerSystemException is a runtime exception that is thrown when a system error occurs during crawling.
     * It extends the RuntimeException class and provides constructors for creating exceptions with a message, a cause, or both.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultData;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 25.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        }
    
        /**
         * Gets the crawl delay value for the specified user agent from robots.txt.
         * The crawl delay specifies the time (in seconds) to wait between successive requests.
         *
         * @param userAgent The user agent string to match against robots.txt directives
         * @return The crawl delay value in seconds. Returns 0 if no matching directive is found
         *         or no crawl delay is specified for the matching directive.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 18.5K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResultData.java

     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.Serializable;
    import java.util.Collection;
    import java.util.LinkedHashSet;
    import java.util.Set;
    import java.util.function.Function;
    
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    
    /**
     * This class represents the result data of a crawl.
     */
    public class ResultData implements Serializable {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/interval/impl/HostIntervalControllerTest.java

    import java.util.concurrent.Future;
    
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.entity.UrlQueueImpl;
    import org.codelibs.fess.crawler.util.CrawlingParameterUtil;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
     * @author hayato
     *
     */
    public class HostIntervalControllerTest extends PlainTestCase {
    
        /**
         * Test that crawling intervals for the same host work correctly.
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 11.4K bytes
    - Viewed (0)
Back to top