Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 30 for Sparse (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

         */
        public SitemapSet parse(final InputStream in) {
            return parse(in, true);
        }
    
        /**
         * Parses a sitemap from the given input stream.
         * @param in the input stream to parse
         * @param recursive whether to recursively parse compressed files
         * @return the parsed sitemap set
         */
        protected SitemapSet parse(final InputStream in, final boolean recursive) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

            // Default constructor
        }
    
        /**
         * Parses a robots.txt file from the given input stream using UTF-8 encoding.
         * @param stream the input stream to parse
         * @return the parsed RobotsTxt object, or null if disabled
         */
        public RobotsTxt parse(final InputStream stream) {
            return parse(stream, Constants.UTF_8);
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

                spfactory.setFeature(Constants.FEATURE_EXTERNAL_PARAMETER_ENTITIES, false);
                // create a sax parser
                final SAXParser parser = spfactory.newSAXParser();
                try {
                    parser.setProperty(XMLConstants.ACCESS_EXTERNAL_DTD, StringUtil.EMPTY);
                    parser.setProperty(XMLConstants.ACCESS_EXTERNAL_SCHEMA, StringUtil.EMPTY);
                } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.4K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

            try (final InputStream is = responseData.getResponseBody()) {
                final DOMParser parser = getDomParser();
                parser.parse(new InputSource(is));
                final Document document = parser.getDocument();
                // base href
                final String baseHref = getBaseHref(document);
                URI uri;
                try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

        }
    
        /**
         * Creates a parse context.
         *
         * @param parser A parser.
         * @param params A map of parameters.
         * @return a parse context.
         */
        protected ParseContext createParseContext(final Parser parser, final Map<String, String> params) {
            final ParseContext parseContext = new ParseContext();
            parseContext.set(Parser.class, parser);
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

            final DOMParser parser = getDomParser();
            try (final Reader reader = new StringReader(content)) {
                parser.parse(new InputSource(reader));
            } catch (final Exception e) {
                logger.warn("Failed to parse the content.", e);
                return new ExtractData(extractString(content));
            }
    
            final Document document = parser.getDocument();
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

                final String enc = getEncoding(bis);
    
                final DOMParser parser = getDomParser();
                final InputSource inputSource = new InputSource(bis);
                inputSource.setEncoding(enc);
                parser.parse(inputSource);
                final Document document = parser.getDocument();
    
                final StringBuilder buf = new StringBuilder(255);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/suggest/util/SuggestUtil.java

            try {
                final StandardQueryParser parser = new StandardQueryParser();
                parser.setDefaultOperator(StandardQueryConfigHandler.Operator.AND);
    
                // Parse with the first field if available, otherwise use "default"
                String defaultField = fields != null && fields.length > 0 ? fields[0] : "default";
                termQueryList = getTermQueryList(parser.parse(q, defaultField), fields);
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 17.4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    import jakarta.annotation.Resource;
    
    /**
     * A response processor implementation that handles sitemaps.
     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

            final DOMParser parser = getDomParser();
            try (final InputStream in = responseData.getResponseBody()) {
                final InputSource is = new InputSource(in);
                if (responseData.getCharSet() != null) {
                    is.setEncoding(responseData.getCharSet());
                }
                parser.parse(is);
            } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
Back to top