Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 109 for url (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

                url = url.substring(0, idx);
            }
    
            url = url.replace("/./", "/");
    
            idx = url.indexOf(";jsessionid");
            if (idx >= 0) {
                url = url.replaceFirst(";jsessionid=[a-zA-Z0-9\\.]*", "");
            }
    
            if (url.indexOf(' ') >= 0) {
                url = url.replace(" ", "%20");
            }
    
            String oldUrl = null;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 29 07:42:33 UTC 2025
    - 30.5K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

         * Checks if a URL exists in the queue by searching OpenSearch and local caches.
         *
         * @param sessionId The session ID.
         * @param url The URL to check.
         * @return true if the URL exists in the queue, false otherwise.
         */
        @Override
        protected boolean exists(final String sessionId, final String url) {
            final boolean ret = super.exists(sessionId, url);
            if (!ret) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:40:57 UTC 2025
    - 16.9K bytes
    - Viewed (1)
  3. fess-crawler/src/main/java/org/codelibs/fess/net/protocol/s3/Handler.java

             * Constructs a new S3URLConnection for the specified URL.
             * This constructor parses the URL to extract bucket and object names.
             *
             * @param url The S3 URL to connect to
             */
            protected S3URLConnection(final URL url) {
                super(url);
                // Extract bucket name from host
                bucketName = url.getHost() != null ? url.getHost() : StringUtil.EMPTY;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 07:57:44 UTC 2025
    - 9.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/net/protocol/gcs/Handler.java

             * Constructs a new GcsURLConnection for the specified URL.
             * This constructor parses the URL to extract bucket and object names.
             *
             * @param url The GCS URL to connect to
             */
            protected GcsURLConnection(final URL url) {
                super(url);
                // Extract bucket name from host
                bucketName = url.getHost() != null ? url.getHost() : StringUtil.EMPTY;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 9.6K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java

                            + "  <url>\n" + "    <loc>http://www.example.com/page1.html</loc>\n" + "    <lastmod>2025-01-01</lastmod>\n"
                            + "    <priority>0.8</priority>\n" + "  </url>\n" + "  <url>\n" + "    <loc></loc>\n" + "  </url>\n" + "  <url>\n"
                            + "    <loc>http://www.example.com/page2.html</loc>\n" + "    <changefreq>daily</changefreq>\n" + "  </url>\n"
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 36.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/net/protocol/storage/Handler.java

             * This constructor parses the URL to extract bucket and object names.
             *
             * @param url The storage URL to connect to
             */
            protected StorageURLConnection(final URL url) {
                super(url);
                // Extract bucket name from host
                bucketName = url.getHost() != null ? url.getHost() : StringUtil.EMPTY;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:52:56 UTC 2025
    - 11.1K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

        /**
         * Get the host on file.
         * @param url The URL.
         * @return The host on file.
         */
        protected String getHostOnFile(final String url) {
            if (StringUtil.isBlank(url)) {
                return StringUtil.EMPTY; // empty
            }
    
            if (url.startsWith("file:////")) {
                final String value = decodeUrlAsName(url.substring(9), true);
                final int pos = value.indexOf('/');
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 25.7K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/DefaultIntervalController.java

        /** Delay in milliseconds after processing a URL */
        protected long delayMillisAfterProcessing = 0L;
    
        /** Delay in milliseconds when no URL is in the queue */
        protected long delayMillisAtNoUrlInQueue = 500L;
    
        /** Delay in milliseconds before processing a URL */
        protected long delayMillisBeforeProcessing = 0L;
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 20 08:58:39 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/helper/ProtocolHelper.java

            return url.startsWith("file:") || url.startsWith("smb:") || url.startsWith("smb1:") || url.startsWith("ftp:")
                    || url.startsWith("storage:") || url.startsWith("s3:") || url.startsWith("gcs:");
        }
    
        /**
         * Checks if the given URL should skip URL decoding when extracting file names.
         * Some protocols (like SMB, FTP, S3, GCS) should preserve the original URL encoding.
         *
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Dec 12 13:58:40 UTC 2025
    - 12.4K bytes
    - Viewed (1)
  10. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

         * This method applies duplicate host conversion before storing the URL.
         *
         * @param childUrl the child URL to store
         * @param parentUrl the parent URL that referenced this child URL
         * @param weight the weight/priority of the child URL
         * @param depth the crawling depth of the child URL
         */
        @Override
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 19.5K bytes
    - Viewed (0)
Back to top