- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 29 for replay (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java
} /** * Gets the crawl delay value for the specified user agent from robots.txt. * The crawl delay specifies the time (in seconds) to wait between successive requests. * * @param userAgent The user agent string to match against robots.txt directives * @return The crawl delay value in seconds. Returns 0 if no matching directive is found * or no crawl delay is specified for the matching directive. */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java
return stripInvalidXMLCharacters(// value// .replace("&", "&amp;") // .replace("<", "&lt;")// .replace(">", "&gt;")// .replace("\"", "&quot;")// .replace("\'", "&apos;")// ); } /** * Strips invalid XML characters from the input string.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 9.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/IntervalController.java
int NO_URL_IN_QUEUE = 4; /** Constant indicating that the crawler is waiting for new URLs. */ int WAIT_NEW_URL = 8; /** * Introduces a delay based on the specified type. * * @param type the type of delay to be introduced */ void delay(int type);Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/DefaultIntervalController.java
/** Delay in milliseconds after processing a URL */ protected long delayMillisAfterProcessing = 0L; /** Delay in milliseconds when no URL is in the queue */ protected long delayMillisAtNoUrlInQueue = 500L; /** Delay in milliseconds before processing a URL */ protected long delayMillisBeforeProcessing = 0L; /** Delay in milliseconds for waiting for new URLs */Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalController.java
* * <p> * Subclasses are responsible for implementing the abstract methods to define the actual delay * mechanism for each of these stages. * </p> * * <p> * The class also provides a mechanism to ignore exceptions that may occur during the delay process. * If {@link #ignoreException} is set to true, any exceptions thrown during the delay will be caught * and ignored. Otherwise, they will be re-thrown as {@link CrawlerSystemException}.Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/FileTransformer.java
*/ protected String path; /** * A string to replace ?. */ protected String questionStr = "_QUEST_"; /** * A string to replace :. */ protected String colonStr = "_CLN_"; /** * A string to replace ;. */ protected String semicolonStr = "_SCLN_"; /** * A string to replace &. */ protected String ampersandStr = "_AMP_";Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 11.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java
* The delayBeforeProcessing method is overridden to introduce a delay before processing a URL, * ensuring that requests to the same host are not made too frequently. * The delay is calculated based on the configured delayMillisBeforeProcessing parameter. * If the time since the last request to the host is less than the configured delay, * the thread waits until the delay has elapsed. * This class is thread-safe. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/fs/FileSystemClientTest.java
} public void test_doGet_dir() { final File file = ResourceUtil.getResourceAsFile("test"); String path = file.getAbsolutePath(); if (!path.startsWith("/")) { path = "/" + path.replace('\\', '/'); } try { fsClient.doGet("file://" + path); fail(); } catch (final ChildUrlsException e) { final Set<RequestData> urlSet = e.getChildUrlList();Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java
String input = content.replaceAll("[\\r\\n]", " "); if (ignoreCommentTag) { input = input.replaceAll("<!--[^>]+-->", ""); } else { input = input.replace("<!--", "").replace("-->", ""); } final Matcher matcher = getTagPattern().matcher(input); final StringBuffer sb = new StringBuffer(); final Pattern attrPattern = Pattern.compile("\\s[^ ]+=\"([^\"]*)\"");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java
protected static final Pattern ALLOW_RECORD = Pattern.compile("^allow:\\s*([^\\s]*)\\s*$", Pattern.CASE_INSENSITIVE); /** Pattern for parsing crawl-delay records. */ protected static final Pattern CRAWL_DELAY_RECORD = Pattern.compile("^crawl-delay:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE); /** * Pattern for Sitemap record. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 7.7K bytes - Viewed (0)