- Sort Score
- Result 10 results
- Languages All
Results 21 - 30 of 63 for ditamap (0.04 sec)
-
src/main/java/org/codelibs/fess/helper/DocumentHelper.java
* @param title the raw title text to process * @param dataMap additional data map (not currently used) * @return the normalized title, or empty string if title is null */ public String getTitle(final ResponseData responseData, final String title, final Map<String, Object> dataMap) { if (title == null) { return StringUtil.EMPTY; // empty }
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 17.2K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java
} /** * Adds a sitemap URL to the list of sitemaps. * * @param url The URL of the sitemap to be added */ public void addSitemap(final String url) { if (!sitemapList.contains(url)) { sitemapList.add(url); } } /** * Returns an array of sitemap URLs. * * @return an array of sitemap URLs */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java
final Set<RequestData> requestDataSet = new LinkedHashSet<>(); for (final Sitemap sitemap : sitemapSet.getSitemaps()) { if (sitemap != null) { requestDataSet.add(RequestDataBuilder.newRequestData().get().url(sitemap.getLoc()).build()); // TODO priority } }
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 3.4K bytes - Viewed (0) -
fess-crawler/src/test/resources/sitemaps/sitemap2.xml
<?xml version="1.0" encoding="UTF-8"?> <sitemapindex xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"> <sitemap> <loc>http://www.example.com/sitemap1.xml.gz</loc> <lastmod>2004-10-01T18:23:17+00:00</lastmod> </sitemap> <sitemap> <loc>http://www.example.com/sitemap2.xml.gz</loc> <lastmod>2005-01-01</lastmod> </sitemap>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Oct 11 02:16:55 UTC 2015 - 376 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java
package org.codelibs.fess.crawler.entity; import org.codelibs.core.lang.StringUtil; /** * Represents a Sitemap file entry, conforming to the Sitemap XML format. * This class holds information about a single Sitemap, including its location and last modification timestamp. * It implements the {@link Sitemap} interface. * * <p> * A Sitemap file provides search engines with a list of URLs available for crawling.
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 4.4K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java
import org.codelibs.core.lang.StringUtil; /** * Represents a URL entry within a sitemap. * * <p> * This class encapsulates the properties of a URL as defined in the sitemap XML format, * including its location, last modification date, change frequency, and priority. * It implements the {@link Sitemap} interface. * </p> * * <p>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 6.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java
* * @param in Input stream for a sitemap * @return a sitemap set */ public SitemapSet parse(final InputStream in) { return parse(in, true); } /** * Parses a sitemap from the given input stream. * @param in the input stream to parse * @param recursive whether to recursively parse compressed files * @return the parsed sitemap set */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14.7K bytes - Viewed (0) -
src/main/resources/crawler/rule.xml
<component class="org.codelibs.fess.crawler.processor.impl.SitemapsResponseProcessor"> </component> </property> <postConstruct name="addRule"> <arg>"url"</arg> <arg>"http[s]?:.*sitemap[^/]*\.xml.*|http[s]?:.*sitemap[^/]*\.gz.*|http[s]?:.*sitemap[^/]*\.txt.*"</arg> </postConstruct> </component> <component name="webHtmlRule" class="org.codelibs.fess.crawler.rule.impl.RegexRule" > <property name="ruleId">"webHtmlRule"</property>
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jun 04 08:42:49 UTC 2020 - 4.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/app/web/admin/general/AdminGeneralAction.java
validate(form, messages -> {}, () -> asHtml(path_AdminGeneral_AdminGeneralJsp)); final String[] toAddresses = form.notificationTo.split(","); final Map<String, Object> dataMap = new HashMap<>(); dataMap.put("hostname", systemHelper.getHostname()); final FessConfig fessConfig = ComponentUtil.getFessConfig(); final Postbox postbox = ComponentUtil.getComponent(Postbox.class); try {
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 13.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java
* represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream. * The rule checks if the URL matches the defined regex pattern and then validates the content as a sitemap. * If any exception occurs during the sitemap validation, it logs the error and returns false. * */ public class SitemapsRule extends RegexRule { /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 2.6K bytes - Viewed (0)