Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 67 for batter (0.03 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            assertEquals(20, context.getMaxThreadCheckCount());
            assertEquals(-1, context.getMaxDepth());
            assertEquals(0L, context.getMaxAccessCount());
        }
    
        /**
         * Test sessionId getter and setter
         */
        public void test_sessionId() {
            assertNull(crawlerContext.getSessionId());
    
            crawlerContext.setSessionId("test-session-001");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

        protected static final Pattern ALLOW_RECORD = Pattern.compile("^allow:\\s*([^\\s]*)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /** Pattern for parsing crawl-delay records. */
        protected static final Pattern CRAWL_DELAY_RECORD = Pattern.compile("^crawl-delay:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /**
         * Pattern for Sitemap record.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

        /**
         * Test adding invalid regex include pattern
         */
        public void test_addInclude_invalidRegex() {
            String sessionId = "test-session-004";
            urlFilter.init(sessionId);
    
            // Invalid regex pattern should be handled gracefully
            urlFilter.addInclude(".*[invalid");
            urlFilter.addInclude("https://valid.com/.*");
    
            // Valid pattern should still work
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  4. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        </magic>
        <glob pattern="*.bin"/>
        <glob pattern="*.dms"/>
        <glob pattern="*.lha"/>
        <glob pattern="*.lrf"/>
        <glob pattern="*.lzh"/>
        <glob pattern="*.so"/>
        <glob pattern="*.dist"/>
        <glob pattern="*.distz"/>
        <glob pattern="*.pkg"/>
        <glob pattern="*.bpk"/>
        <glob pattern="*.dump"/>
        <glob pattern="*.elc"/>
        <glob pattern="*.deploy"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

         * @return the parsed charset name, or null if not found
         */
        protected String parseCharset(final String content) {
            final Pattern pattern = Pattern.compile("; *charset *= *([a-zA-Z0-9\\-_]+)", Pattern.CASE_INSENSITIVE);
            final Matcher matcher = pattern.matcher(content);
            if (matcher.find()) {
                return matcher.group(1);
            }
            return null;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/AbstractRule.java

     * Provides common functionality and properties for crawler rules.
     *
     * <p>
     * This class handles the registration of rules with the {@link RuleManager}
     * and provides getter and setter methods for common properties such as
     * {@code ruleId} and {@code responseProcessor}.
     * </p>
     *
     * <p>
     * Subclasses should extend this class and implement the abstract methods
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/impl/AuthenticationImpl.java

     * This class provides methods to handle authentication details such as
     * authentication scope, credentials, and authentication scheme.
     *
     * <p>
     * It includes constructors to initialize these details and getter and setter
     * methods to access and modify them.
     * </p>
     *
     * <p>
     * Example usage:
     * </p>
     * <pre>
     * {@code
     * AuthScope authScope = new AuthScope("example.com", 80);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/MemoryDataHelper.java

        }
    
        /**
         * Adds an include URL pattern for the specified session.
         * @param sessionId the session ID
         * @param url the URL pattern to include
         */
        public synchronized void addIncludeUrlPattern(final String sessionId, final String url) {
            final List<Pattern> patternList = getIncludeUrlPatternList(sessionId);
            patternList.add(Pattern.compile(url));
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.1K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

        /**
         * Pattern for XML tags.
         */
        protected Pattern xmlTagPattern = Pattern.compile("<[^>]+>");
    
        /**
         * Returns the encoding pattern.
         * @return The encoding pattern.
         */
        @Override
        protected Pattern getEncodingPattern() {
            return xmlEncodingPattern;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

            final List<Pattern> includeList = getUrlFilterService().getIncludeUrlPatternList(sessionId);
            final List<Pattern> excludeList = getUrlFilterService().getExcludeUrlPatternList(sessionId);
    
            if (!includeList.isEmpty()) {
                boolean match = false;
                for (final Pattern pattern : includeList) {
                    final Matcher matcher = pattern.matcher(url);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
Back to top