Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 8 of 8 for parsing (0.07 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

     *
     * @author bowez
     * @author shinsuke
     *
     */
    public class RobotsTxtHelper {
    
        /** Pattern for parsing user-agent records. */
        protected static final Pattern USER_AGENT_RECORD =
                Pattern.compile("^user-agent:\\s*([^\\t\\n\\x0B\\f\\r]+)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /** Pattern for parsing disallow records. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

     * passed to a {@link ChildUrlsException} to be processed by the crawler.
     * </p>
     *
     * <p>
     * The class also handles potential {@link IOException}s that may occur during
     * the parsing of the response body.
     * </p>
     */
    public class SitemapsResponseProcessor implements ResponseProcessor {
        /** The crawler container for component lookup. */
        @Resource
        protected CrawlerContainer crawlerContainer;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

         *
         * @param accessResultData the data containing the XML content to be parsed
         * @return a map containing the parsed data from the XML content
         * @throws CrawlerSystemException if an error occurs while parsing the XML content
         */
        public static Map<String, Object> getDataMap(final AccessResultData<?> accessResultData) {
            // create input source
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.4K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/suggest/index/contents/ContentsParser.java

    import org.codelibs.fess.suggest.entity.SuggestItem;
    import org.codelibs.fess.suggest.index.contents.querylog.QueryLog;
    import org.codelibs.fess.suggest.normalizer.Normalizer;
    
    /**
     * Interface for parsing content and creating suggest items.
     */
    public interface ContentsParser {
        /**
         * Parses the given search words and creates a SuggestItem.
         *
         * @param words the array of search words
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 4.1K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

                logger.warn("Failed to parse the content by {}", path, e);
                return StringUtil.EMPTY_STRINGS;
            }
    
        }
    
        /**
         * Creates and configures a DOM parser for parsing HTML content.
         *
         * @return a configured DOMParser instance
         * @throws CrawlerSystemException if the parser configuration is invalid
         */
        protected DOMParser getDomParser() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcConnectionMonitorTarget.java

     * <ul>
     *   <li>{@link #expired()}: Handles the expiration of connections by closing expired and idle connections.</li>
     * </ul>
     *
     * <p>Logging:</p>
     * <ul>
     *   <li>Logs a warning if the clientConnectionManager is null.</li>
     *   <li>Logs a warning if an exception occurs during connection monitoring.</li>
     * </ul>
     *
     */
    public class HcConnectionMonitorTarget implements TimeoutTarget {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.3K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/CrawlingAccessException.java

         */
        public static final String DEBUG = "DEBUG";
    
        /**
         * Log level constant for info messages.
         */
        public static final String INFO = "INFO";
    
        /**
         * Log level constant for warning messages.
         */
        public static final String WARN = "WARN";
    
        /**
         * Log level constant for error messages.
         */
        public static final String ERROR = "ERROR";
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  8. src/test/java/org/codelibs/fess/suggest/index/contents/document/ESSourceReaderTest.java

            int count = 0;
            int prev = -1;
            Map<String, Object> source;
            while ((source = reader.read()) != null) {
                int current = Integer.parseInt(source.get("field2").toString());
                assertTrue(prev < current);
                prev = current;
                count++;
            }
            assertEquals(num, count);
    
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 9K bytes
    - Viewed (0)
Back to top