- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 64 for ditamap (0.05 sec)
-
src/main/java/org/codelibs/fess/helper/CrawlingInfoHelper.java
* * @param dataMap the document data map containing URL, roles, and virtual host information * @return a unique hashed ID string for the document */ public String generateId(final Map<String, Object> dataMap) { final FessConfig fessConfig = ComponentUtil.getFessConfig(); final String url = (String) dataMap.get(fessConfig.getIndexFieldUrl());
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 15.2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessorTest.java
ResponseData responseData = new ResponseData(); byte[] content = "<sitemap></sitemap>".getBytes(); responseData.setResponseBody(content); SitemapUrl sitemap = new SitemapUrl(); sitemap.setLoc("https://example.com/page1"); SitemapSet sitemapSet = new SitemapSet(); sitemapSet.addSitemap(sitemap); when(crawlerContainer.getComponent("sitemapsHelper")).thenReturn(sitemapsHelper);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Nov 13 13:29:22 UTC 2025 - 12K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java
/** * Represents a URL entry within a sitemap. * * <p> * This class encapsulates the properties of a URL as defined in the sitemap XML format, * including its location, last modification date, change frequency, and priority. * It also supports sitemap extensions such as images, videos, news, and alternate links. * It implements the {@link Sitemap} interface. * </p> * * <p>
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Nov 13 13:34:36 UTC 2025 - 9.1K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/DocumentHelper.java
* @param title the raw title text to process * @param dataMap additional data map (not currently used) * @return the normalized title, or empty string if title is null */ public String getTitle(final ResponseData responseData, final String title, final Map<String, Object> dataMap) { if (title == null) { return StringUtil.EMPTY; // empty }
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Fri Nov 28 16:29:12 UTC 2025 - 17.4K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java
sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*")); assertTrue(sitemapsRule.match(responseData)); InputStream is = responseData.getResponseBody(); assertTrue(is instanceof InputStream); CloseableUtil.closeQuietly(responseData); } private void assertMatchFalse(ResponseData responseData) { sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*"));
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 4.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapSet.java
sitemapList.add(sitemap); } /** * Removes a sitemap from this set. * @param sitemap the sitemap to remove */ public void removeSitemap(final Sitemap sitemap) { sitemapList.remove(sitemap); } /** * Gets all sitemaps in this set as an array. * @return an array of sitemaps */ public Sitemap[] getSitemaps() {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.9K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/ds/callback/IndexUpdateCallback.java
* * @param paramMap the data store parameters containing configuration and metadata * @param dataMap the document data to be indexed as key-value pairs */ void store(DataStoreParams paramMap, Map<String, Object> dataMap); /** * Returns the total number of documents processed by this callback. * * @return the document count */
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 1.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java
+ " <loc>http://www.example.com/sitemap2.xml</loc>\n" + " </sitemap>\n" + "</sitemapindex>"; final InputStream in = new ByteArrayInputStream(xml.getBytes()); final SitemapSet sitemapSet = sitemapsHelper.parse(in); final Sitemap[] sitemaps = sitemapSet.getSitemaps();
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 36.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
final Set<RequestData> requestDataSet = new LinkedHashSet<>(); for (final Sitemap sitemap : sitemapSet.getSitemaps()) { if (sitemap != null) { requestDataSet.add(RequestDataBuilder.newRequestData().get().url(sitemap.getLoc()).build()); // TODO priority } }
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_malformed.txt
User-agent: Bot1 User-agent: Bot2 User-agent: Bot3 Disallow: /shared/ # Case 11: Sitemap with various formats Sitemap: http://example.com/sitemap.xml sitemap: http://example.com/sitemap2.xml SITEMAP: http://example.com/sitemap3.xml Sitemap: # empty sitemap (should be ignored) Sitemap: not-a-valid-url # Case 12: Malformed lines that should be completely ignored This line is completely invalid :NoKey
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Fri Nov 14 12:52:01 UTC 2025 - 2.6K bytes - Viewed (0)