Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 46 for parent (0.02 sec)

  1. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt

    User-agent: FessCrawler
    Disallow:           # allows all 
    
    User-agent: BruteBot
    Disallow: /
    Allow: /foo/bar/
    Crawl-delay: 1314000
    
    # welcome!
    User-agent: Googlebot
    Crawl-delay: 1
    
    User-agent: *
    Disallow: /private/
    Disallow: /help        # disallows /help.html, /help/index.html, etc.
    Allow: /help/faq.html
    Crawl-delay: 3
    
    User-agent: Crawler
    Disallow: /aaa
    
    User-agent: Crawler/1.0
    Disallow: /bbb
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 566 bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

     * </a></li>
     * </ul>
     *
     * @author bowez
     * @author shinsuke
     *
     */
    public class RobotsTxtHelper {
    
        /** Pattern for parsing user-agent records. */
        protected static final Pattern USER_AGENT_RECORD =
                Pattern.compile("^user-agent:\\s*([^\\t\\n\\x0B\\f\\r]+)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /** Pattern for parsing disallow records. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

            this.authSchemeProviderMap = authSchemeProviderMap;
        }
    
        /**
         * Sets the user agent string.
         * <p>
         * The given value is stored as-is in this instance's {@code userAgent} field;
         * no validation or normalization is performed here.
         *
         * @param userAgent The user agent string.
         */
        public void setUserAgent(final String userAgent) {
            this.userAgent = userAgent;
        }
    
        /**
         * Sets the credentials provider.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.2K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/suggest/index/contents/document/ESSourceReader.java

            }
    
            if (limitPercentage.endsWith("%")) {
                this.limitPercentage = Integer.parseInt(limitPercentage.substring(0, limitPercentage.length() - 1));
            } else {
                this.limitPercentage = Integer.parseInt(limitPercentage);
            }
    
            if (this.limitPercentage > 100) {
                this.limitPercentage = 100;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 11K bytes
    - Viewed (0)
  5. src/test/java/org/codelibs/fess/suggest/index/contents/document/ESSourceReaderTest.java

            int count = 0;
            int prev = -1;
            Map<String, Object> source;
            while ((source = reader.read()) != null) {
                int current = Integer.parseInt(source.get("field2").toString());
                assertTrue(prev < current);
                prev = current;
                count++;
            }
            assertEquals(num, count);
    
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 9K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/scvp-cv-request",
    				"application/scvp-cv-response",
    				"application/scvp-vp-request",
    				"application/scvp-vp-response",
    				"application/sdp",
    				"application/set-payment",
    				"application/set-payment-initiation",
    				"application/set-registration",
    				"application/set-registration-initiation",
    				"application/sgml",
    				"application/sgml-open-catalog",
    				"application/shf+xml",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

    import jakarta.mail.Address;
    import jakarta.mail.BodyPart;
    import jakarta.mail.Header;
    import jakarta.mail.Message;
    import jakarta.mail.MessagingException;
    import jakarta.mail.Multipart;
    import jakarta.mail.Part;
    import jakarta.mail.Session;
    import jakarta.mail.internet.MailDateFormat;
    import jakarta.mail.internet.MimeMessage;
    import jakarta.mail.internet.MimeUtility;
    
    /**
     * Gets a text from .eml file.
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  8. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                tempDir.delete();
                tempDir.mkdirs();
    
                // robots.txt
                StringBuilder buf = new StringBuilder();
                buf.append("User-agent: *").append('\n');
                buf.append("Disallow: /admin/").append('\n');
                buf.append("Disallow: /websvn/").append('\n');
                final File robotTxtFile = new File(tempDir, "robots.txt");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/MultipleCrawlingAccessException.java

    /**
     * An exception that indicates multiple crawling access exceptions occurred.
     * This exception holds an array of Throwable objects representing the individual causes.
     * It extends CrawlingAccessException and provides methods to print the stack traces of all causes.
     *
     */
    public class MultipleCrawlingAccessException extends CrawlingAccessException {
    
        private static final long serialVersionUID = 1L;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.5K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                tempDir.delete();
                tempDir.mkdirs();
    
                // robots.txt
                StringBuilder buf = new StringBuilder();
                buf.append("User-agent: *").append('\n');
                buf.append("Disallow: /admin/").append('\n');
                buf.append("Disallow: /websvn/").append('\n');
                final File robotTxtFile = new File(tempDir, "robots.txt");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
Back to top