Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 18 for m_regex (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

                }
            }
        }
    
        /**
         * Adds a client with a regular expression pattern.
         * @param regex The regular expression to match URLs.
         * @param client The CrawlerClient instance.
         */
        public void addClient(final String regex, final CrawlerClient client) {
            if (StringUtil.isBlank(regex)) {
                throw new CrawlerSystemException("A regular expression is null.");
            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PasswordBasedExtractor.java

         * Adds a password for files matching the given regular expression pattern.
         * @param regex the regular expression pattern to match against URLs or resource names
         * @param password the password to use for matching files
         */
        public void addPassword(final String regex, final String password) {
            passwordMap.put(Pattern.compile(regex), password);
        }
    
        /**
         * Returns the password for the given parameters.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java

         * @param regex The regular expression to match URLs.
         * @param componentName The name of the component to register.
         */
        public synchronized void register(final String regex, final String componentName) {
            clientMap.put(regex, componentName);
            clientFactoryList.forEach(f -> load(f, regex, componentName));
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactoryWrapper.java

         * @param regex The regular expression for the client.
         * @param client The CrawlerClient instance.
         */
        @Override
        public void addClient(final String regex, final CrawlerClient client) {
            factory.addClient(regex, client);
        }
    
        /**
         * Adds a client to the wrapped factory at a specific position.
         * @param regex The regular expression for the client.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.2K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RegexRule.java

        /**
         * Adds a regular expression rule for the specified field.
         * @param key the field name to match against
         * @param regex the regular expression pattern
         */
        public void addRule(final String key, final String regex) {
            regexMap.put(key, Pattern.compile(regex));
        }
    
        /**
         * Adds a compiled regular expression rule for the specified field.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.2K bytes
    - Viewed (0)
  6. src/test/java/org/codelibs/opensearch/extension/analysis/PatternConcatenationFilterFactory.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.opensearch.extension.analysis;
    
    import java.util.regex.Pattern;
    
    import org.apache.lucene.analysis.TokenStream;
    import org.codelibs.analysis.ja.PatternConcatenationFilter;
    import org.opensearch.common.settings.Settings;
    import org.opensearch.env.Environment;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

     */
    package org.codelibs.fess.crawler.filter.impl;
    
    import java.util.LinkedHashSet;
    import java.util.List;
    import java.util.Set;
    import java.util.regex.Matcher;
    import java.util.regex.Pattern;
    import java.util.stream.Collectors;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import java.io.BufferedReader;
    import java.io.InputStream;
    import java.io.InputStreamReader;
    import java.util.ArrayList;
    import java.util.List;
    import java.util.Locale;
    import java.util.regex.Matcher;
    import java.util.regex.Pattern;
    
    import org.apache.commons.io.input.BOMInputStream;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.RobotsTxt;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.util.regex.Pattern;
    
    /**
     * Extracts text content from XML documents.
     */
    public class XmlExtractor extends AbstractXmlExtractor {
    
        /**
         * Creates a new XmlExtractor instance.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

     * represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream.
     * The rule checks if the URL matches the defined regex pattern and then validates the content as a sitemap.
     * If any exception occurs during the sitemap validation, it logs the error and returns false.
     *
     */
    public class SitemapsRule extends RegexRule {
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
Back to top