Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 39 for supported (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/AbstractCrawlerClient.java

            throw new CrawlerSystemException("GET method is not supported.");
        }
    
        /**
         * Handles a HEAD request for the given URL.
         * <p>
         * This implementation performs no request: it always throws to signal
         * that HEAD is not supported.
         * </p>
         * @param url The URL to request.
         * @return The ResponseData (this implementation never returns normally).
         * @throws CrawlerSystemException always, reporting that HEAD is not supported.
         */
        protected ResponseData doHead(final String url) {
            final String message = "HEAD method is not supported.";
            throw new CrawlerSystemException(message);
        }
    
        /**
         * Performs a POST request.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 9.7K bytes
    - Viewed (10)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/UnsupportedExtractException.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * UnsupportedExtractException is thrown when the content extraction is not supported.
     * It extends ExtractException and indicates that the requested extraction operation cannot be performed.
     *
     */
    public class UnsupportedExtractException extends ExtractException {
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RequestData.java

    /**
     * Represents a request data for crawling.
     * This class encapsulates the HTTP method, URL, and weight associated with a crawling request.
     */
    public class RequestData {
        /**
         * The HTTP request methods that a crawling request can carry.
         * Constant order is part of the contract (ordinals): GET, POST, HEAD.
         */
        public enum Method {
            /** The GET request method. */
            GET,
            /** The POST request method. */
            POST,
            /** The HEAD request method. */
            HEAD
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4K bytes
    - Viewed (0)
  4. README.md

    crawler.urlFilter.addInclude(".*\\.pdf$");
    
    // Exclude patterns  
    crawler.urlFilter.addExclude(".*\\.js$");
    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    ### Protocols
    - **HTTP/HTTPS**: Full web crawling support with cookies, authentication, redirects
    - **File System**: Local and network file system access
    - **FTP**: FTP server crawling with authentication
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

            }
        }
    
        /**
         * Checks if the specified charset is supported.
         *
         * @param charsetName the charset name to check
         * @return true if the charset is supported, false otherwise
         */
        protected boolean isSupportedCharset(final String charsetName) {
            if (charsetName == null) {
                return false;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

         * @return The result data body.
         */
        protected String getResultDataBody(final String name, final String value) {
            // TODO: Support other XML footer types
            // TODO: Support other field types and trimming options

            // Escape the attribute value first, then the element text, so the
            // helper calls happen in the same left-to-right order as a single
            // concatenation expression would evaluate them.
            final String escapedName = XmlUtil.escapeXml(name);
            // A null value is rendered as an empty element body.
            final String rawValue = value == null ? "" : value;
            final String fieldText = trimSpace(XmlUtil.escapeXml(rawValue));
            return "<field name=\"" + escapedName + "\">" + fieldText + "</field>\n";
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

    import org.xml.sax.SAXNotRecognizedException;
    import org.xml.sax.SAXNotSupportedException;
    import org.xml.sax.helpers.DefaultHandler;
    
    /**
     * Helper class for parsing and validating sitemaps.
     * It supports XML sitemaps, XML sitemap indexes, and text sitemaps,
     * and can handle GZIP compressed sitemaps.
     * The class provides methods to check if an input stream is a valid sitemap,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/IgnoreCloseInputStream.java

         */
        @Override
        public synchronized void mark(final int readlimit) {
            // Pure delegation: the read limit is passed unchanged to inputStream.
            inputStream.mark(readlimit);
        }
    
        /**
         * Tests if this input stream supports the mark and reset methods.
         * The answer is taken directly from {@code inputStream}; this class adds
         * no mark/reset logic of its own in this method.
         *
         * @return the result of {@code inputStream.markSupported()}: true if mark and
         *         reset are supported; false otherwise
         */
        @Override
        public boolean markSupported() {
            return inputStream.markSupported();
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java

     * extractor that iterates through the available extractors until one successfully
     * extracts the data.
     * </p>
     *
     * <p>
     * The class uses a {@link CrawlerContainer} for managing crawler components and
     * supports dependency injection via the {@link Resource} annotation.
     * </p>
     */
    public class ExtractorFactory {
    
        /** Logger instance for this class */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/storage/StorageClient.java

     *   <li>readTimeout - Read timeout in milliseconds (default: 10000)</li>
     * </ul>
     *
     * <p>The client supports URLs in the format: {@code storage://bucket-name/object-path}
     *
     * <p>Features:
     * <ul>
     *   <li>Automatic initialization of MinIO client</li>
     *   <li>Support for HEAD and GET operations</li>
     *   <li>Content length validation</li>
     *   <li>MIME type detection</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17.9K bytes
    - Viewed (2)
Back to top