Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 28 for unparse (0.03 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/SitemapsHelperTest.java

            try {
                sitemapsHelper.parse(in);
                fail();
            } catch (final CrawlingAccessException e) {
                // NOP
            }
        }
    
        public void test_parseXmlSitemaps_invalid2() {
            final byte[] bytes = "test".getBytes();
            final InputStream in = new ByteArrayInputStream(bytes);
    
            try {
                sitemapsHelper.parse(in);
                fail();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

         * @param stream the input stream to parse
         * @return the parsed RobotsTxt object, or null if disabled
         */
        public RobotsTxt parse(final InputStream stream) {
            return parse(stream, Constants.UTF_8);
        }
    
        /**
         * Parses a robots.txt file from the given input stream using the specified character encoding.
         * @param stream the input stream to parse
         * @param charsetName the character encoding to use
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

         */
        public SitemapSet parse(final InputStream in) {
            return parse(in, true);
        }
    
        /**
         * Parses a sitemap from the given input stream.
         * @param in the input stream to parse
         * @param recursive whether to recursively parse compressed files
         * @return the parsed sitemap set
         */
        protected SitemapSet parse(final InputStream in, final boolean recursive) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  4. src/test/java/org/codelibs/opensearch/extension/kuromoji/index/analysis/KuromojiTokenizerFactory.java

            nBestCost = settings.getAsInt(NBEST_COST, -1);
            nBestExamples = settings.get(NBEST_EXAMPLES);
        }
    
        private static String parse(String rule, Set<String> dup) {
            String[] values = CSVUtil.parse(rule);
            if (dup.add(values[0]) == false) {
                throw new IllegalArgumentException("Found duplicate term [" + values[0] + "] in user dictionary.");
            }
            return rule;
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

            } finally {
                FileUtil.deleteInBackground(tempFile);
            }
        }
    
        /**
         * Creates a parse context.
         *
         * @param parser A parser.
         * @param params A map of parameters.
         * @return a parse context.
         */
        protected ParseContext createParseContext(final Parser parser, final Map<String, String> params) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/suggest/index/contents/ContentsParser.java

        /**
         * Parses the given query log and returns a list of suggest items.
         *
         * @param queryLog the query log to parse
         * @param fields the fields to extract from the query log
         * @param tagFieldNames the names of the fields to use as tags
         * @param roleFieldName the name of the field to use for roles
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 4.1K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

        }
    
        public void testParse() {
            RobotsTxt robotsTxt;
            final InputStream in = RobotsTxtHelperTest.class.getResourceAsStream("robots.txt");
            try {
                robotsTxt = robotsTxtHelper.parse(in);
            } finally {
                CloseableUtil.closeQuietly(in);
            }
    
            for (String userAgent : new String[] { "FessCrawler", "FessCrawler/1.0", "Mozilla FessCrawler" }) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

                } catch (final Exception e) {
                    if (logger.isDebugEnabled()) {
                        logger.debug("Failed to set a property.", e);
                    }
                }
                // parse a content
                parser.parse(is, handler);
    
                return handler.getDataMap();
            } catch (final Exception e) {
                throw new CrawlerSystemException("Could not create a data map from XML content.", e);
            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.4K bytes
    - Viewed (0)
  9. src/test/java/org/codelibs/opensearch/extension/analysis/SynonymLoader.java

                    parser = new WordnetSynonymParser(true, expand, analyzer);
                    ((WordnetSynonymParser) parser).parse(rulesReader);
                } else {
                    parser = new SolrSynonymParser(true, expand, analyzer);
                    ((SolrSynonymParser) parser).parse(rulesReader);
                }
    
                final SynonymMap localSynonymMap = parser.build();
                if (localSynonymMap.fst == null) {
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sun May 18 02:59:16 UTC 2025
    - 6.7K bytes
    - Viewed (1)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
     * from each sitemap, and creates a new {@link RequestData} object for each URL.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
Back to top