- Sort Score
- Result 10 results
- Languages All
Results 51 - 60 of 65 for urlset (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java
import org.codelibs.fess.crawler.service.UrlFilterService; import jakarta.annotation.Resource; /** * Implementation of the {@link UrlFilter} interface. * This class provides functionality to filter URLs based on include and exclude patterns. * It uses a {@link UrlFilterService} to manage the URL filtering rules. * The class supports caching of include and exclude patterns for scenarios where a session ID is not available.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueue.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.entity; /** * The UrlQueue interface represents a queue of URLs to be processed by a web crawler. * It provides methods to get and set various properties of a URL queue entry. * * @param <IDTYPE> the type of the identifier for the URL queue entry */ public interface UrlQueue<IDTYPE> {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 4.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/storage/StorageClient.java
* <li>writeTimeout - Write timeout in milliseconds (default: 10000)</li> * <li>readTimeout - Read timeout in milliseconds (default: 10000)</li> * </ul> * * <p>The client supports URLs in the format: {@code storage://bucket-name/object-path} * * <p>Features: * <ul> * <li>Automatic initialization of MinIO client</li> * <li>Support for HEAD and GET operations</li>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 17.9K bytes - Viewed (2) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/MemoryDataHelper.java
/** Map of session IDs to include URL patterns for filtering URLs. */ protected volatile Map<String, List<Pattern>> includeUrlPatternMap = new HashMap<>(); /** Map of session IDs to exclude URL patterns for filtering URLs. */ protected volatile Map<String, List<Pattern>> excludeUrlPatternMap = new HashMap<>(); /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbClient.java
} } } catch (final Exception e) { logger.warn(e.getLocalizedMessage()); } buf.reset(); } else { buf.write(b); } } })); } /** The charset used for encoding and decoding. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Sep 18 09:30:45 UTC 2025 - 23K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/pool/CrawlerPooledObjectFactoryTest.java
private CrawlerPooledObjectFactory<TestComponent> factory; private StandardCrawlerContainer container; @Override protected void setUp() throws Exception { super.setUp(); // Reset counters before each test TestComponent.resetCounter(); SingletonTestComponent.resetInstanceCount(); // Initialize container with test components
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 19.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java
* * <p>This class is final and cannot be instantiated.</p> * * <p>The following parameters are managed:</p> * <ul> * <li>{@link UrlQueue} - The queue of URLs to be crawled.</li> * <li>{@link CrawlerContext} - The context of the current crawling process.</li> * <li>{@link UrlQueueService} - The service for managing the URL queue.</li>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/net/protocol/storage/Handler.java
/** * Handler for the "storage" protocol, allowing access to objects stored in a MinIO-compatible storage service. * This handler extends {@link URLStreamHandler} to provide a way to open connections to storage objects * using URLs with the "storage" protocol. * * <p> * The URL format is expected to be: {@code storage://bucketName/objectName}. * The bucket name and object name are extracted from the URL. * </p> * * <p>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.5K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/AbstractRuleTest.java
public int getProcessCount() { return processCount; } public ResponseData getLastProcessedData() { return lastProcessedData; } public void reset() { processCount = 0; lastProcessedData = null; } } private StandardCrawlerContainer container; private TestRuleManager ruleManager;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 21.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java
* @return the response data * @throws CrawlingAccessException if unable to access the URI * @throws ChildUrlsException if the URI represents a directory with child URLs */ protected ResponseData getResponseData(final String uri, final boolean includeContent) { final ResponseData responseData = new ResponseData(); try {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 13.8K bytes - Viewed (0)