Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 20 for passes (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

                spfactory.setFeature(Constants.FEATURE_EXTERNAL_PARAMETER_ENTITIES, false);
                // create a sax parser
                final SAXParser parser = spfactory.newSAXParser();
                try {
                    parser.setProperty(XMLConstants.ACCESS_EXTERNAL_DTD, StringUtil.EMPTY);
                    parser.setProperty(XMLConstants.ACCESS_EXTERNAL_SCHEMA, StringUtil.EMPTY);
                } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

            // Default constructor
        }
    
        /**
         * Parses a robots.txt file from the given input stream using UTF-8 encoding.
         * @param stream the input stream to parse
         * @return the parsed RobotsTxt object, or null if disabled
         */
        public RobotsTxt parse(final InputStream stream) {
            return parse(stream, Constants.UTF_8);
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/suggest/index/contents/ContentsParser.java

         * @param normalizer the normalizer to use for normalizing values
         * @return a list of suggest items parsed from the query log
         */
        List<SuggestItem> parseQueryLog(QueryLog queryLog, String[] fields, String[] tagFieldNames, String roleFieldName,
                ReadingConverter readingConverter, Normalizer normalizer);
    
        /**
         * Parses a document and extracts suggest items based on the provided fields and converters.
         *
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 4.1K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    import jakarta.annotation.Resource;
    
    /**
     * A response processor implementation that handles sitemaps.
     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

            final DOMParser parser = getDomParser();
            try (final Reader reader = new StringReader(content)) {
                parser.parse(new InputSource(reader));
            } catch (final Exception e) {
                logger.warn("Failed to parse the content.", e);
                return new ExtractData(extractString(content));
            }
    
            final Document document = parser.getDocument();
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  6. src/test/java/org/codelibs/opensearch/extension/analysis/SynonymLoader.java

                SynonymMap.Builder parser = null;
    
                if ("wordnet".equalsIgnoreCase(settings.get("format"))) {
                    parser = new WordnetSynonymParser(true, expand, analyzer);
                    ((WordnetSynonymParser) parser).parse(rulesReader);
                } else {
                    parser = new SolrSynonymParser(true, expand, analyzer);
                    ((SolrSynonymParser) parser).parse(rulesReader);
                }
    
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sun May 18 02:59:16 UTC 2025
    - 6.7K bytes
    - Viewed (1)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PasswordBasedExtractor.java

        /** Map of regex patterns to passwords for static password configuration. */
        protected Map<Pattern, String> passwordMap = new HashMap<>();
    
        /** Cache for parsed password configurations from extraction parameters. */
        private final Map<String, List<Pair<Pattern, String>>> configPasswordMap = new ConcurrentHashMap<>();
    
        /**
         * Creates a new PasswordBasedExtractor instance.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java

            try {
                sitemapsHelper.parse(in);
                fail();
            } catch (final CrawlingAccessException e) {
                // NOP
            }
        }
    
        public void test_parseXmlSitemaps_invalid2() {
            final byte[] bytes = "test".getBytes();
            final InputStream in = new ByteArrayInputStream(bytes);
    
            try {
                sitemapsHelper.parse(in);
                fail();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.6K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/MultipleCrawlingAccessException.java

    /**
     * An exception that indicates multiple crawling access exceptions occurred.
     * This exception holds an array of Throwable objects representing the individual causes.
     * It extends CrawlingAccessException and provides methods to print the stack traces of all causes.
     *
     */
    public class MultipleCrawlingAccessException extends CrawlingAccessException {
    
        private static final long serialVersionUID = 1L;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * when making decisions, they may crawl pages marked "hourly" less
         * frequently than that, and they may crawl pages marked "yearly" more
         * frequently than that. Crawlers may periodically crawl pages marked
         * "never" so that they can handle unexpected changes to those pages.
         */
        private String changefreq;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
Back to top