- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 29 for Burles (0.03 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/UrlConvertHelper.java
/** * Helper class for converting URLs based on a set of predefined rules. * * <p>This class provides functionality to convert URLs by replacing parts of the URL * based on a map of target strings and their corresponding replacements. It allows * adding new conversion rules, setting the entire conversion map, and converting * URLs using these rules.</p> *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/impl/UrlFilterImpl.java
import jakarta.annotation.Resource; /** * Implementation of the {@link UrlFilter} interface. * This class provides functionality to filter URLs based on include and exclude patterns. * It uses a {@link UrlFilterService} to manage the URL filtering rules. * The class supports caching of include and exclude patterns for scenarios where a session ID is not available.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java
} /** * Returns the set of robots.txt URLs. * @return The set of robots.txt URLs. */ public Set<String> getRobotsTxtUrlSet() { return robotsTxtUrlSet; } /** * Sets the set of robots.txt URLs. * @param robotsTxtUrlSet The set of robots.txt URLs. */ public void setRobotsTxtUrlSet(final Set<String> robotsTxtUrlSet) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/RuleManager.java
*/ package org.codelibs.fess.crawler.rule; import org.codelibs.fess.crawler.entity.ResponseData; /** * The RuleManager interface provides methods to manage rules for processing response data. * It allows adding, retrieving, and removing rules, as well as checking for their existence. */ public interface RuleManager { /** * Retrieves the rule associated with the given response data. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
import jakarta.annotation.Resource; /** * A response processor implementation that handles sitemaps. * It parses the response body as a SitemapSet, extracts URLs from the sitemaps, * and adds them as child URLs to be crawled. * * <p> * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text. * It then iterates through the sitemaps in the SitemapSet, extracts the URL
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/Rule.java
import java.io.Serializable; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.processor.ResponseProcessor; /** * The Rule interface defines the contract for implementing rules that can be applied to * response data in a web crawler. Implementations of this interface should provide logic * to determine if a given response data matches the rule, retrieve the rule's identifier,
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 1.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java
* <li>{@code POST_PROCESSING} - Represents the post-processing state.</li> * <li>{@code NO_URL_IN_QUEUE} - Indicates that there are no URLs in the queue.</li> * <li>{@code WAIT_NEW_URL} - Indicates that the crawler is waiting for new URLs.</li> * </ul> */ public interface IntervalController { /** Constant representing the pre-processing state. */ int PRE_PROCESSING = 1;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/ChildUrlsException.java
/** * {@link ChildUrlsException} is thrown when child URLs are found during crawling. * It extends {@link CrawlerSystemException} and holds a set of {@link RequestData} * representing the child URLs that caused the exception. * */ public class ChildUrlsException extends CrawlerSystemException { private static final long serialVersionUID = 1L; /** * The list of child URLs. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImpl.java
import org.codelibs.fess.crawler.rule.RuleManager; /** * Implementation of the {@link RuleManager} interface. * Manages a list of rules for the crawler. * Provides methods to add, remove, check, and retrieve rules. * */ public class RuleManagerImpl implements RuleManager { /** The list of rules managed by this rule manager. */ protected final List<Rule> ruleList = new ArrayList<>(); /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java
} } /** * Registers a client component with a regular expression. * The component will be loaded into all registered CrawlerClientFactories. * @param regex The regular expression to match URLs. * @param componentName The name of the component to register. */ public synchronized void register(final String regex, final String componentName) { clientMap.put(regex, componentName);
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.5K bytes - Viewed (0)