Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 150 for Crawling (0.2 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

    import org.codelibs.fess.crawler.service.UrlQueueService;
    import org.slf4j.Logger;
    import org.slf4j.LoggerFactory;
    
    import jakarta.annotation.Resource;
    
    /**
     * Crawler manages/controls a crawling information.
     *
     * @author shinsuke
     *
     */
    public class Crawler implements Runnable, AutoCloseable {
    
        private static final Logger logger = LoggerFactory.getLogger(Crawler.class);
    
        @Resource
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 7.9K bytes
    - Viewed (0)
  2. test-site/app/models/ContentsCreator.java

            Queue<String> queue = getUrls();
    
            String url;
            int count = 0;
            while((url = queue.poll()) != null && count < max) {
    
                try {
                    Logger.info("crawling: " + url);
                    HttpUriRequest request = new HttpGet(url);
                    HttpResponse response = httpClient.execute(request);
                    if(response.getStatusLine().getStatusCode() != HttpStatus.SC_OK) {
    Registered: Fri Nov 08 09:08:12 UTC 2024
    - Last Modified: Fri Nov 06 08:48:32 UTC 2015
    - 3.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

                    if (logger.isDebugEnabled()) {
                        logger.debug("Canceled urlQueue: {}", urlQueue);
                    }
                    // cancel crawling
                    crawlerContext.decrementAndGetAccessCount();
                    final List<UrlQueue<?>> newUrlQueueList = new ArrayList<>();
                    newUrlQueueList.add(urlQueue);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 9K bytes
    - Viewed (0)
  4. src/main/resources/fess_message.properties

    errors.design_file_name_is_invalid=The file name is invalid.
    errors.design_file_is_unsupported_type=The kind of file is unsupported.
    errors.failed_to_create_crawling_config_at_wizard=Failed to create a crawling config.
    errors.design_editor_disabled=This feature is disabled.
    errors.not_found_on_file_system=Not Found: {0}
    errors.could_not_open_on_system=Could not open {0}. <br/>Please check if the file is associated with an application.
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Mar 18 03:05:44 UTC 2023
    - 12.5K bytes
    - Viewed (0)
  5. src/main/resources/fess_message_en.properties

    errors.design_file_name_is_invalid=The file name is invalid.
    errors.design_file_is_unsupported_type=The kind of file is unsupported.
    errors.failed_to_create_crawling_config_at_wizard=Failed to create a crawling config.
    errors.design_editor_disabled=This feature is disabled.
    errors.not_found_on_file_system=Not Found: {0}
    errors.could_not_open_on_system=Could not open {0}. <br/>Please check if the file is associated with an application.
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Mar 18 03:05:44 UTC 2023
    - 12.4K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/helper/CrawlingConfigHelper.java

                    }
                    default -> null;
                    };
                });
            } catch (final Exception e) {
                logger.warn("Failed to access a crawling config cache: {}", configId, e);
                return null;
            }
        }
    
        public OptionalThing<String> getPipeline(final String configId) {
            final CrawlingConfig config = getCrawlingConfig(configId);
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:53:18 UTC 2024
    - 11.7K bytes
    - Viewed (0)
  7. src/test/java/org/codelibs/fess/it/admin/CrawlerLogTests.java

        }
    
        @Test
        void searchListTest() {
            logger.info("start searchListTest");
            testReadSearchList();
            testDeleteSearchList();
        }
    
        /**
         * Methods for a Web Crawling Job
         * */
        private static void createWebConfig() {
            final Map<String, Object> requestBody = new HashMap<>();
            final String urls = "https://www.codelibs.org/" + "\n" + "http://failure.url";
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 9.1K bytes
    - Viewed (0)
  8. docs/de/README.md

    ![Administrationsoberfläche](https://fess.codelibs.org/_images/fess_admin_dashboard.png)
    
    Sie können in der Administrationsoberfläche (Web, Datei, Datenspeicher) Crawling-Ziele in den Crawler-Konfigurationsseiten registrieren und den Crawler manuell auf der [Scheduler-Seite](https://fess.codelibs.org/14.17/admin/scheduler-guide.html) starten.
    
    ## Migration von einem anderen Suchanbieter
    
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Sat Oct 12 07:19:47 UTC 2024
    - 7.6K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/app/web/admin/wizard/AdminWizardAction.java

                    fileConfigService.store(fConfig);
                }
                return configName;
            } catch (final Exception e) {
                logger.warn("Failed to create crawling config: {}", form.crawlingConfigPath, e);
                throwValidationError(messages -> messages.addErrorsFailedToCreateCrawlingConfigAtWizard(GLOBAL),
                        () -> asHtml(path_AdminWizard_AdminWizardConfigJsp));
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:53:18 UTC 2024
    - 12.7K bytes
    - Viewed (0)
  10. src/main/resources/fess_config.properties

    page.keymatch.max.fetch.size=1000
    page.labeltype.max.fetch.size=1000
    page.roletype.max.fetch.size=1000
    page.user.max.fetch.size=1000
    page.role.max.fetch.size=1000
    page.group.max.fetch.size=1000
    page.crawling.info.param.max.fetch.size=100
    page.crawling.info.max.fetch.size=1000
    page.data.config.max.fetch.size=100
    page.web.config.max.fetch.size=100
    page.file.config.max.fetch.size=100
    page.duplicate.host.max.fetch.size=1000
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Tue Oct 01 14:13:38 UTC 2024
    - 30.9K bytes
    - Viewed (0)
Back to top