Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 56 for pattern2 (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java

         * (java.lang.String)
         */
        /**
         * Looks up the exclusion URL patterns associated with a session.
         * The lookup is delegated to {@code dataHelper}.
         *
         * @param sessionId The ID of the session whose exclusion patterns are requested.
         * @return The list of patterns that {@code dataHelper} returns for that session.
         */
        @Override
        public List<Pattern> getExcludeUrlPatternList(final String sessionId) {
            final List<Pattern> excludePatterns = dataHelper.getExcludeUrlPatternList(sessionId);
            return excludePatterns;
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        </magic>
        <glob pattern="*.bin"/>
        <glob pattern="*.dms"/>
        <glob pattern="*.lha"/>
        <glob pattern="*.lrf"/>
        <glob pattern="*.lzh"/>
        <glob pattern="*.so"/>
        <glob pattern="*.dist"/>
        <glob pattern="*.distz"/>
        <glob pattern="*.pkg"/>
        <glob pattern="*.bpk"/>
        <glob pattern="*.dump"/>
        <glob pattern="*.elc"/>
        <glob pattern="*.deploy"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  3. .teamcity/src/main/kotlin/common/CommonExtensions.kt

     * @param historyDays number of days to store build history.
     * @param artifactsDays number of days to store artifacts. In the stored history, artifacts older than this number will be cleaned up.
     * @param artifactsPatterns patterns for artifacts clean-up. If not specified, all artifacts will be removed.
     */
    fun Project.cleanupRule(
        historyDays: Int,
        artifactsDays: Int,
        artifactsPatterns: String? = null,
    ) {
        features {
    Registered: Wed Sep 10 11:36:15 UTC 2025
    - Last Modified: Wed Sep 10 01:37:13 UTC 2025
    - 15K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

        /** Idle connection timeout in milliseconds */
        protected long idleConnectionTimeout = 60 * 1000L; // 1min
    
        /** Pattern for matching HTTP redirect status codes */
        protected Pattern redirectHttpStatusPattern = Pattern.compile("[3][0-9][0-9]");
    
        /** Whether to use robots.txt disallow rules */
        protected boolean useRobotsTxtDisallows = true;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

        /**
         * Pattern for XML tags.
         */
        protected Pattern xmlTagPattern = Pattern.compile("<[^>]+>");
    
        /**
         * Provides the encoding pattern, which for this class is the
         * {@code xmlEncodingPattern} field.
         *
         * @return The current value of {@code xmlEncodingPattern}.
         */
        @Override
        protected Pattern getEncodingPattern() {
            return this.xmlEncodingPattern;
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

        protected static final Pattern ALLOW_RECORD = Pattern.compile("^allow:\\s*([^\\s]*)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /** Pattern for parsing crawl-delay records. */
        protected static final Pattern CRAWL_DELAY_RECORD = Pattern.compile("^crawl-delay:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /**
         * Pattern for Sitemap record.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  7. README.md

    crawler.crawlerContext.setDefaultIntervalTime(1000); // 1 second
    ```
    
    ### URL Filtering
    
    ```java
    // Include patterns
    crawler.urlFilter.addInclude("https://example.com/.*");
    crawler.urlFilter.addInclude(".*\\.pdf$");
    
    // Exclude patterns  
    crawler.urlFilter.addExclude(".*\\.js$");
    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java

        }
    
        /**
         * Extracts the token value from the content using the given pattern.
         * @param tokenPattern The regex pattern.
         * @param content The content to search.
         * @return The extracted token value.
         */
        protected String getTokenValue(final String tokenPattern, final String content) {
            final Matcher matcher = Pattern.compile(tokenPattern).matcher(content);
            if (matcher.find()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (1)
  9. src/buildall.bash

    if [ "$sete" = true ]; then
    	set -e
    fi
    
    pattern="$1"
    if [ "$pattern" = "" ]; then
    	pattern=.
    fi
    
    ./make.bash || exit 1
    GOROOT="$(cd .. && pwd)"
    
    # Prints one target per line: the output of "go tool dist list" with the
    # first "/" of each line replaced by "-", minus every line that starts with
    # "android" or "ios", followed by the extra entry linux-arm-arm5.
    gettargets() {
    	# android/ios are dropped: need C toolchain even for cross-compiling
    	../bin/go tool dist list |
    		sed -e 's|/|-|' |
    		grep -E -v '^(android|ios)'
    	# Additional target appended after the filtered list.
    	echo linux-arm-arm5
    }
    
    # Prints the lines produced by gettargets that match the extended regular
    # expression stored in $pattern.
    selectedtargets() {
    	gettargets | grep -E "$pattern"
    }
    
    Registered: Tue Sep 09 11:13:09 UTC 2025
    - Last Modified: Tue Apr 23 17:45:23 UTC 2024
    - 2.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/UrlFilter.java

         * @param url URL
         * @return true if url is matched
         */
        boolean match(String url);
    
        /**
         * Adds a URL pattern as a target.
         *
         * @param urlPattern Regular expression for URLs that are crawled
         */
        void addInclude(String urlPattern);
    
        /**
         * Add a URL pattern as a non-target.
         *
         * @param urlPattern Regular expression that is not crawled
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.6K bytes
    - Viewed (0)
Back to top