- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 13 for UrlSet (0.04 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java
/** * Represents a set of Sitemaps, which can be either a UrlSet or an Index. * This class provides methods to manage a list of Sitemap objects and determine the type of the SitemapSet. * */ public class SitemapSet implements Serializable { private static final long serialVersionUID = 1L; /** Constant for UrlSet type. */ public static final String URLSET = "UrlSet"; /** Constant for Index type. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/ftp/FtpClientTest.java
fail(); } catch (final ChildUrlsException e) { final Set<RequestData> urlSet = e.getChildUrlList(); assertEquals(1, urlSet.size()); for (final RequestData requestData : urlSet.toArray(new RequestData[urlSet.size()])) { String url = requestData.getUrl(); assertTrue(url.contains("dir1/test3.txt")); }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 18K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java
*/ public void test_robotsTxtUrlSet() { Set<String> urlSet = crawlerContext.getRobotsTxtUrlSet(); assertNotNull(urlSet); assertTrue(urlSet instanceof LruHashSet); assertTrue(urlSet.isEmpty()); // Add URLs to default set urlSet.add("http://example.com/robots.txt"); urlSet.add("http://test.com/robots.txt");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/fs/FileSystemClientTest.java
try { fsClient.doGet("file://" + path); fail(); } catch (final ChildUrlsException e) { final Set<RequestData> urlSet = e.getChildUrlList(); for (final RequestData requestData : urlSet.toArray(new RequestData[urlSet.size()])) { String url = requestData.getUrl(); if (url.indexOf(".svn") < 0) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java
final int depth, final String encoding) { // add url and filter final Set<String> urlSet = new HashSet<>(); final List<UrlQueue<?>> childList = childUrlList.stream() .filter(d -> StringUtil.isNotBlank(d.getUrl()) && urlSet.add(d.getUrl()) && crawlerContext.getUrlFilter().match(d.getUrl())) .map(d -> {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 12.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
try { if (bis.read(bytes) == -1) { return false; } final String preloadDate = new String(bytes, Constants.UTF_8); if (preloadDate.indexOf("<urlset") >= 0 || preloadDate.indexOf("<sitemapindex") >= 0 || preloadDate.startsWith("http://") || preloadDate.startsWith("https://")) { // XML Sitemaps return true; }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.7K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java
robotTxtFile.deleteOnExit(); // sitemaps.xml buf = new StringBuilder(); buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n'); buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n'); buf.append("<url>").append('\n'); buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java
robotTxtFile.deleteOnExit(); // sitemaps.xml buf = new StringBuilder(); buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n'); buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n'); buf.append("<url>").append('\n'); buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 6.3K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java
} final Set<RequestData> urlSet = new HashSet<>(docList.size()); for (final Map<String, Object> doc : docList) { final String url = DocumentUtil.getValue(doc, fessConfig.getIndexFieldUrl(), String.class); if (StringUtil.isNotBlank(url)) { urlSet.add(RequestDataBuilder.newRequestData().get().url(url).build()); } }
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java
fail(); } catch (final CrawlingAccessException e) { // NOP } } public void test_parseXmlSitemaps_invalid3() { final byte[] bytes = "<urlset".getBytes(); final InputStream in = new ByteArrayInputStream(bytes); try { sitemapsHelper.parse(in); fail(); } catch (final CrawlingAccessException e) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 9.6K bytes - Viewed (0)