Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 54 for crawl (1.15 sec)

  1. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_malformed.txt

    User-agent: GoodBot
    Disallow: /admin/
    InvalidDirective: some-value
    unknown-field: test
    Disallow /missing-colon
    Disallow:    # empty value (should be treated as allowing all)
    Allow: /public/
    Crawl-delay: invalid-number
    Crawl-delay: -10
    Crawl-delay: 5.5
    Crawl-delay:
    Allow:    # empty value
    
    # Case 3: Multiple colons in directive
    User-agent: MultiColonBot
    Disallow: http://example.com:8080/path
    Allow: /path:with:colons
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 14 12:52:01 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  2. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt

    User-agent: FessCrawler
    Disallow:           # allows all 
    
    User-agent: BruteBot
    Disallow: /
    Allow: /foo/bar/
    Crawl-delay: 1314000
    
    # welcome!
    User-agent: Googlebot
    Crawl-delay: 1
    
    User-agent: *
    Disallow: /private/
    Disallow: /help        # disallows /help.html, /help/index.html, etc.
    Allow: /help/faq.html
    Crawl-delay: 3
    
    User-agent: Crawler
    Disallow: /aaa
    
    User-agent: Crawler/1.0
    Disallow: /bbb
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 566 bytes
    - Viewed (0)
  3. build-logic-commons/code-quality-rules/src/main/resources/checkstyle/checkstyle-api.xml

      ~ See the License for the specific language governing permissions and
      ~ limitations under the License.
      -->
    <!DOCTYPE module PUBLIC
            "-//Puppy Crawl//DTD Check Configuration 1.2//EN"
            "http://www.puppycrawl.com/dtds/configuration_1_2.dtd">
    <module name="Checker">
        <module name="SuppressionFilter">
            <property name="file" value="${config_loc}/suppressions.xml"/>
    Registered: Wed Dec 31 11:36:14 UTC 2025
    - Last Modified: Thu Nov 17 23:20:14 UTC 2022
    - 1.6K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/app/web/admin/fileconfig/CreateForm.java

        @Size(max = 200)
        public String name;
    
        /** The description of the file configuration (maximum 1000 characters). */
        @Size(max = 1000)
        public String description;
    
        /** The file paths to crawl (required, must be valid file URIs). */
        @Required
        @UriType(protocolType = ProtocolType.FILE)
        @CustomSize(maxKey = "form.admin.max.input.size")
        public String paths;
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 5.6K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * command. Even though search engine crawlers may consider this information
         * when making decisions, they may crawl pages marked "hourly" less
         * frequently than that, and they may crawl pages marked "yearly" more
         * frequently than that. Crawlers may periodically crawl pages marked
         * "never" so that they can handle unexpected changes to those pages.
         */
        private String changefreq;
    
        /**
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 13:34:36 UTC 2025
    - 9.1K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/app/web/admin/dataconfig/EditForm.java

     * This form extends CreateForm to include fields necessary for updating existing data config entries,
     * including tracking information for optimistic locking and audit trails.
     * Data configs define how to crawl and extract data from databases, CSV files, and other data sources.
     *
     */
    public class EditForm extends CreateForm {
    
        /**
         * Creates a new EditForm instance.
         */
        public EditForm() {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.3K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/api/admin/webconfig/SearchBody.java

        /**
         * Default constructor.
         */
        public SearchBody() {
            super();
        }
    
        /** Name of the web crawling configuration */
        public String name;
    
        /** URLs to crawl */
        public String urls;
    
        /** Description of the web crawling configuration */
        public String description;
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  8. src/main/webapp/WEB-INF/view/admin/relatedquery/admin_relatedquery_edit.jsp

    <div class="wrapper">
        <jsp:include page="/WEB-INF/view/common/admin/header.jsp"></jsp:include>
        <jsp:include page="/WEB-INF/view/common/admin/sidebar.jsp">
            <jsp:param name="menuCategoryType" value="crawl"/>
            <jsp:param name="menuType" value="relatedQuery"/>
        </jsp:include>
        <main class="content-wrapper">
            <div class="content-header">
                <div class="container-fluid">
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Nov 13 05:54:52 UTC 2025
    - 4.8K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/app/web/admin/webconfig/EditForm.java

     * This form extends CreateForm to include fields necessary for updating existing web config entries,
     * including tracking information for optimistic locking and audit trails.
     * Web configs define how to crawl and index web sites and web applications.
     *
     */
    public class EditForm extends CreateForm {
    
        /**
         * Creates a new EditForm instance.
         */
        public EditForm() {
            super();
        }
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.3K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/app/web/admin/fileconfig/EditForm.java

     * This form extends CreateForm to include fields necessary for updating existing file config entries,
     * including tracking information for optimistic locking and audit trails.
     * File configs define how to crawl and index files from local file systems, SMB shares, and FTP servers.
     *
     */
    public class EditForm extends CreateForm {
    
        /**
         * Creates a new EditForm instance.
         */
        public EditForm() {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 2.3K bytes
    - Viewed (0)
Back to top