- Sort Score
- Result 10 results
- Languages All
Results 21 - 30 of 65 for urlset (0.02 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java
/** * {@link ChildUrlsException} is thrown when child URLs are found during crawling. * It extends {@link CrawlerSystemException} and holds a set of {@link RequestData} * representing the child URLs that caused the exception. * */ public class ChildUrlsException extends CrawlerSystemException { private static final long serialVersionUID = 1L; /** * The list of child URLs. */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java
* <li>{@code POST_PROCESSING} - Represents the post-processing state.</li> * <li>{@code NO_URL_IN_QUEUE} - Indicates that there are no URLs in the queue.</li> * <li>{@code WAIT_NEW_URL} - Indicates that the crawler is waiting for new URLs.</li> * </ul> */ public interface IntervalController { /** Constant representing the pre-processing state. */ int PRE_PROCESSING = 1;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java
} } /** * Registers a client component with a regular expression. * The component will be loaded into all registered CrawlerClientFactories. * @param regex The regular expression to match URLs. * @param componentName The name of the component to register. */ public synchronized void register(final String regex, final String componentName) { clientMap.put(regex, componentName);Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlFilterService.java
*/ void addIncludeUrlFilter(String sessionId, String url); /** * Adds a list of URLs to the include filter for a given session. * * @param sessionId the ID of the session for which the URLs should be included * @param urlList the list of URLs to be added to the include filter */ void addIncludeUrlFilter(String sessionId, List<String> urlList); /**Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 3.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
InputStream in = null; try { if (isByteStream) { inputStream.reset(); in = inputStream; } else { in = new FileInputStream(tempFile); }Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
} /** * Returns the set of robots.txt URLs. * @return The set of robots.txt URLs. */ public Set<String> getRobotsTxtUrlSet() { return robotsTxtUrlSet; } /** * Sets the set of robots.txt URLs. * @param robotsTxtUrlSet The set of robots.txt URLs. */ public void setRobotsTxtUrlSet(final Set<String> robotsTxtUrlSet) {Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ResultData.java
protected String transformerName; /** The data of the result. */ protected byte[] data; /** The encoding of the result. */ protected String encoding; /** The set of the child URLs. */ protected Set<RequestData> childUrlSet = new LinkedHashSet<>(); /** The raw data. */ protected Object rawData = null; /** The serializer. */ protected Function<Object, byte[]> serializer;Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/AbstractTransformerTest.java
assertEquals("http://example.com/test", transformer.getLastResponseData().getUrl()); // Reset and verify transformer.reset(); assertEquals(0, transformer.getTransformCallCount()); assertNull(transformer.getLastResponseData()); // Name should persist after reset assertEquals("workflowTransformer", transformer.getName()); }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 20.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java
REDIRECT_LOCATION, /** Indicates processing a response. */ PROCESS_RESPONSE, /** Indicates the crawling process has finished. */ FINISHED_CRAWLING, /** Indicates processing child URLs due to an exception. */ PROCESS_CHILD_URLS_BY_EXCEPTION, /** Indicates processing a child URL due to an exception. */ PROCESS_CHILD_URL_BY_EXCEPTION, /** Indicates an access exception during crawling. */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java
* influence the position of your URLs in a search engine's result pages. * Search engines may use this information when selecting between URLs on * the same site, so you can use this tag to increase the likelihood that * your most important pages are present in a search index. * * Also, please note that assigning a high priority to all of the URLs on
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 6.5K bytes - Viewed (0)