Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 111 - 120 of 524 for crawling (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

    import org.w3c.dom.Node;
    import org.xml.sax.InputSource;
    
    import jakarta.annotation.Resource;
    
    /**
     * The {@code HtmlTransformer} class is responsible for transforming HTML responses
     * during the crawling process. It extracts data, identifies child URLs, and handles
     * character set encoding.
     * <p>
     * This class extends {@link AbstractTransformer} and utilizes various helper classes
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  2. src/test/java/org/codelibs/fess/indexer/IndexUpdaterTest.java

        public void test_init_withIngestFactory() {
            ComponentUtil.register(ingestFactory, "ingestFactory");
            indexUpdater.init();
            assertNotNull(indexUpdater);
        }
    
        // Test destroy when crawling is not finished
        public void test_destroy_notFinished() {
            final List<Crawler> crawlerList = new ArrayList<>();
            final TestCrawler crawler = new TestCrawler();
            crawlerList.add(crawler);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Tue Aug 19 14:09:36 UTC 2025
    - 33K bytes
    - Viewed (0)
  3. src/test/java/org/codelibs/fess/exec/CrawlerTest.java

            // We just verify that the crawl completes with EXIT_OK
            assertTrue("Crawler should complete", result == Constants.EXIT_OK);
        }
    
        // Test concurrent crawling
        public void test_doCrawl_concurrentWebAndData() {
            final List<String> executionOrder = Collections.synchronizedList(new ArrayList<>());
    
            WebFsIndexHelper mockWebHelper = new WebFsIndexHelper() {
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Tue Aug 19 14:09:36 UTC 2025
    - 30.5K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

            }
            return false;
        }
    
        /**
         * Create the parameters for extraction.
         * @param responseData The response data.
         * @param crawlingConfig The crawling configuration.
         * @return The parameters for extraction.
         */
        protected Map<String, String> createExtractParams(final ResponseData responseData, final CrawlingConfig crawlingConfig) {
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/TransformerTest.java

            transformer.addTransformationRule("<[^>]+>", ""); // Remove HTML tags
            transformer.addTransformationRule("\\s+", " "); // Normalize whitespace
    
            // Simulate crawling response
            ResponseData responseData = new ResponseData();
            responseData.setUrl("http://example.com/page.html");
            responseData.setParentUrl("http://example.com/");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 28K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/mylasta/action/FessMessages.java

        public static final String ERRORS_design_file_is_unsupported_type = "{errors.design_file_is_unsupported_type}";
    
        /** The key of the message: Failed to create a crawling config at a wizard. */
        public static final String ERRORS_failed_to_create_crawling_config_at_wizard = "{errors.failed_to_create_crawling_config_at_wizard}";
    
        /** The key of the message: This feature is disabled. */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jul 05 02:36:47 UTC 2025
    - 119.6K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                        buf.append(e.getCause().getMessage());
                    }
                    logger.info(buf.toString());
                } else if (logger.isDebugEnabled()) {
                    logger.debug("Crawling Access Exception at {}", url, e);
                }
            }
    
            // request header
            for (final Header header : requestHeaderList) {
                httpRequest.addHeader(header);
            }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
  8. android/guava-tests/test/com/google/common/io/testdata/alice_in_wonderland.txt

    to learn?'
    
      `Well, there was Mystery,' the Mock Turtle replied, counting
    off the subjects on his flappers, `--Mystery, ancient and modern,
    with Seaography:  then Drawling--the Drawling-master was an old
    conger-eel, that used to come once a week:  HE taught us
    Drawling, Stretching, and Fainting in Coils.'
    
      `What was THAT like?' said Alice.
    
      `Well, I can't show it you myself,' the Mock Turtle said:  `I'm
    Registered: Fri Sep 05 12:43:10 UTC 2025
    - Last Modified: Fri Apr 21 02:27:51 UTC 2017
    - 145.2K bytes
    - Viewed (0)
  9. src/archive/tar/testdata/trailing-slash.tar

    Caio Marcelo de Oliveira Filho <******@****.***> 1514852203 -0800
    Registered: Tue Sep 09 11:13:09 UTC 2025
    - Last Modified: Tue Feb 13 18:36:49 UTC 2018
    - 2.5K bytes
    - Viewed (0)
  10. src/archive/zip/testdata/test-trailing-junk.zip

    Russ Cox <******@****.***> 1410149331 -0400
    Registered: Tue Sep 09 11:13:09 UTC 2025
    - Last Modified: Mon Sep 08 04:08:51 UTC 2014
    - 1.2K bytes
    - Viewed (0)
Back to top