Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 51 - 60 of 65 for urlset (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java

    import org.codelibs.fess.crawler.service.UrlFilterService;
    
    import jakarta.annotation.Resource;
    
    /**
     * Implementation of the {@link UrlFilter} interface.
     * This class provides functionality to filter URLs based on include and exclude patterns.
     * It uses a {@link UrlFilterService} to manage the URL filtering rules.
     * The class supports caching of include and exclude patterns for scenarios where a session ID is not available.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueue.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    /**
     * The UrlQueue interface represents a queue of URLs to be processed by a web crawler.
     * It provides methods to get and set various properties of a URL queue entry.
     *
     * @param <IDTYPE> the type of the identifier for the URL queue entry
     */
    public interface UrlQueue<IDTYPE> {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/storage/StorageClient.java

     *   <li>writeTimeout - Write timeout in milliseconds (default: 10000)</li>
     *   <li>readTimeout - Read timeout in milliseconds (default: 10000)</li>
     * </ul>
     *
     * <p>The client supports URLs in the format: {@code storage://bucket-name/object-path}
     *
     * <p>Features:
     * <ul>
     *   <li>Automatic initialization of MinIO client</li>
     *   <li>Support for HEAD and GET operations</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17.9K bytes
    - Viewed (2)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/MemoryDataHelper.java

        /** Map of session IDs to include URL patterns for filtering URLs. */
        protected volatile Map<String, List<Pattern>> includeUrlPatternMap = new HashMap<>();
    
        /** Map of session IDs to exclude URL patterns for filtering URLs. */
        protected volatile Map<String, List<Pattern>> excludeUrlPatternMap = new HashMap<>();
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.1K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbClient.java

                                }
                            }
                        } catch (final Exception e) {
                            logger.warn(e.getLocalizedMessage());
                        }
                        buf.reset();
                    } else {
                        buf.write(b);
                    }
                }
            }));
        }
    
        /** The charset used for encoding and decoding. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 23K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/pool/CrawlerPooledObjectFactoryTest.java

        private CrawlerPooledObjectFactory<TestComponent> factory;
        private StandardCrawlerContainer container;
    
        @Override
        protected void setUp() throws Exception {
            super.setUp();
    
            // Reset counters before each test
            TestComponent.resetCounter();
            SingletonTestComponent.resetInstanceCount();
    
            // Initialize container with test components
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19.3K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

     *
     * <p>This class is final and cannot be instantiated.</p>
     *
     * <p>The following parameters are managed:</p>
     * <ul>
     *   <li>{@link UrlQueue} - The queue of URLs to be crawled.</li>
     *   <li>{@link CrawlerContext} - The context of the current crawling process.</li>
     *   <li>{@link UrlQueueService} - The service for managing the URL queue.</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/net/protocol/storage/Handler.java

    /**
     * Handler for the "storage" protocol, allowing access to objects stored in a MinIO-compatible storage service.
     * This handler extends {@link URLStreamHandler} to provide a way to open connections to storage objects
     * using URLs with the "storage" protocol.
     *
     * <p>
     * The URL format is expected to be: {@code storage://bucketName/objectName}.
     * The bucket name and object name are extracted from the URL.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.5K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/AbstractRuleTest.java

            public int getProcessCount() {
                return processCount;
            }
    
            public ResponseData getLastProcessedData() {
                return lastProcessedData;
            }
    
            public void reset() {
                processCount = 0;
                lastProcessedData = null;
            }
        }
    
        private StandardCrawlerContainer container;
        private TestRuleManager ruleManager;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 21.9K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java

         * @return the response data
         * @throws CrawlingAccessException if unable to access the URI
         * @throws ChildUrlsException if the URI represents a directory with child URLs
         */
        protected ResponseData getResponseData(final String uri, final boolean includeContent) {
            final ResponseData responseData = new ResponseData();
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.8K bytes
    - Viewed (0)
Back to top