Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 28 for "found" (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        /**
         * Map of user agent patterns to their corresponding directives.
         * Backed by a {@link LinkedHashMap}, so entries iterate in insertion order.
         */
        protected final Map<Pattern, Directive> directiveMap = new LinkedHashMap<>();
    
        /** List of sitemap URLs found in the robots.txt file. */
        private final List<String> sitemapList = new ArrayList<>();
    
        /**
         * Creates a new RobotsTxt instance.
         * <p>
         * Takes no arguments; the body is intentionally empty and executes no
         * statements of its own.
         */
        public RobotsTxt() {
            // Default constructor
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XPathAPI.java

        }
    
        /**
         * Use an XPath string to select a single node.
         *
         * @param contextNode The node to start searching from.
         * @param expression A valid XPath string.
         * @return The first node found that matches the XPath, or null.
         *
         * @throws XPathExpressionException if an XPath expression error occurs.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java

     */
    package org.codelibs.fess.crawler.exception;
    
    import java.util.Set;
    
    import org.codelibs.fess.crawler.entity.RequestData;
    
    /**
     * {@link ChildUrlsException} is thrown when child URLs are found during crawling.
     * It extends {@link CrawlerSystemException} and holds a set of {@link RequestData}
     * representing the child URLs that caused the exception.
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.8K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

            if (cachedXPathAPI == null) {
                cachedXPathAPI = new XPathAPI();
                xpathAPI.set(cachedXPathAPI);
            }
            return cachedXPathAPI;
        }
    
        /**
         * Stores child URLs found in the HTML content.
         *
         * @param responseData the response data containing the HTML content
         * @param resultData the result data to store child URLs in
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbAuthenticationHolder.java

        }
    
        /**
         * Retrieves an SMB authentication configuration that matches the given path.
         * @param path The path to match.
         * @return The matching SmbAuthentication object, or null if no match is found.
         */
        public SmbAuthentication get(final String path) {
            if (path == null) {
                return null;
            }
    
            for (final Map.Entry<String, SmbAuthentication> entry : authMap.entrySet()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java

         * that tries each extractor in order until one succeeds.
         *
         * @param key the key to look up
         * @return the extractor for the key, or null if not found
         */
        public Extractor getExtractor(final String key) {
            final Extractor[] extractors = extractorMap.get(key);
            if (extractors == null || extractors.length == 0) {
                return null;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/AbstractCrawlerClient.java

         * @param <T> The type of the parameter.
         * @param key The key of the parameter.
         * @param defaultValue The default value if the parameter is not found.
         * @param clazz The class type to convert the parameter to.
         * @return The parameter value, or the default value if not found.
         */
        protected <T> T getInitParameter(final String key, final T defaultValue, final Class<T> clazz) {
            if (initParamMap != null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 9.7K bytes
    - Viewed (10)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ExtractData.java

        }
    
        /**
         * Looks up the metadata values stored under the supplied key.
         *
         * @param key the metadata key to look up
         * @return the values mapped to {@code key}, or null if not found
         */
        public String[] getValues(final String key) {
            final String[] values = metadata.get(key);
            return values;
        }
    
        /**
         * Gets the set of all metadata keys.
         *
         * @return the set of metadata keys
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  9. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/AbstractCrawlerService.java

         * @param clazz The class of the object to retrieve.
         * @param sessionId The session ID of the document.
         * @param url The URL of the document.
         * @return The retrieved object, or null if not found.
         * @throws OpenSearchAccessException if the retrieval fails.
         */
        protected <T> T get(final Class<T> clazz, final String sessionId, final String url) {
            final String id = getId(sessionId, url);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 34.2K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

        }
    
        /**
         * Gets the received date from a message by parsing the received headers.
         *
         * @param message the message to get the received date from
         * @return the received date or null if not found
         * @throws MessagingException if message access fails
         */
        protected static Date getReceivedDate(final Message message) throws MessagingException {
            final Date today = new Date();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
Back to top