Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 11 - 20 of 399 for crawlen (0.04 seconds)

  1. fess-crawler-lasta/src/main/resources/crawler.xml

    <components namespace="fessCrawler">
    	<include path="crawler/container.xml"/>
    	<include path="crawler/client.xml"/>
    	<include path="crawler/rule.xml"/>
    	<include path="crawler/filter.xml"/>
    	<include path="crawler/interval.xml"/>
    	<include path="crawler/extractor.xml"/>
    	<include path="crawler/mimetype.xml"/>
    	<include path="crawler/encoding.xml"/>
    	<include path="crawler/urlconverter.xml"/>
    	<include path="crawler/log.xml"/>
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Tue Nov 28 13:40:25 GMT 2017
    - 1.7K bytes
    - Click Count (0)
  2. src/main/java/org/codelibs/fess/ds/callback/FileListIndexUpdateCallbackImpl.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.client.CrawlerClient;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 29.7K bytes
    - Click Count (3)
  3. src/main/resources/mail/crawler.dfmail

    /*
     [Crawler Notification]
     Crawler notification mail.
    */
    subject: [FESS] Crawler completed: /*pmb.hostname*/
    >>>
    --- Server Info ---
    Host Name: /*pmb.hostname:orElse('Unknown')*/
    Job Name: /*pmb.jobname:orElse('Unknown')*/
    
    --- Web/FileSystem Crawler ---
    Start Time: /*pmb.webFsCrawlStartTime:orElse('-')*/
    End Time:   /*pmb.webFsCrawlEndTime:orElse('-')*/
    Exec Time:  /*pmb.webFsCrawlExecTime:orElse('-')*/ ms
    
    --- Web/FileSystem Indexer ---
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Wed Jan 15 22:05:20 GMT 2020
    - 1K bytes
    - Click Count (0)
  4. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                crawler1.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler1.getCrawlerContext().setNumOfThread(numOfThread);
    
                final Crawler crawler2 = getComponent(Crawler.class);
                crawler2.setBackground(true);
                ((UrlFilterImpl) crawler2.urlFilter).setIncludeFilteringPattern("$1$2$3.*");
                crawler2.addUrl(url2);
                crawler2.getCrawlerContext().setMaxAccessCount(maxCount);
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Thu Jan 15 01:11:43 GMT 2026
    - 7.8K bytes
    - Click Count (0)
  5. src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

    import org.codelibs.fess.Constants;
    import org.codelibs.fess.crawler.Crawler;
    import org.codelibs.fess.crawler.CrawlerContext;
    import org.codelibs.fess.crawler.CrawlerStatus;
    import org.codelibs.fess.crawler.interval.FessIntervalController;
    import org.codelibs.fess.crawler.service.impl.OpenSearchDataService;
    import org.codelibs.fess.crawler.service.impl.OpenSearchUrlFilterService;
    import org.codelibs.fess.crawler.service.impl.OpenSearchUrlQueueService;
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Nov 28 16:29:12 GMT 2025
    - 25K bytes
    - Click Count (0)
  6. CLAUDE.md

    │   ├── config/                # Config index (crawl configs, schedules)
    │   ├── log/                   # Log index (search logs, click logs)
    │   └── user/                  # User index (users, groups, roles)
    ├── helper/                    # Cross-cutting utilities (~40+ helpers)
    ├── crawler/                   # Crawling engine (processor, transformer, service)
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Mar 19 09:48:10 GMT 2026
    - 7.8K bytes
    - Click Count (0)
  7. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

    import org.codelibs.fess.app.service.FailureUrlService;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.client.CrawlerClient;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.log.LogType;
    import org.codelibs.fess.exception.ContainerNotAvailableException;
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Dec 11 09:47:03 GMT 2025
    - 19.5K bytes
    - Click Count (0)
  8. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/container/LastaCrawlerContainerTest.java

            // Verify that multiple components can be retrieved
            final Crawler crawler1 = crawlerContainer.getComponent("crawler");
            final Crawler crawler2 = crawlerContainer.getComponent("crawler");
    
            // They should be different instances (prototype scope)
            assertNotNull(crawler1);
            assertNotNull(crawler2);
        }
    
        @Test
        public void test_isLastaCrawlerContainer() {
    Created: Sun Apr 12 03:50:13 GMT 2026
    - Last Modified: Fri Jan 16 13:52:11 GMT 2026
    - 2.7K bytes
    - Click Count (0)
  9. src/main/java/org/codelibs/fess/crawler/processor/FessResponseProcessor.java

     */
    package org.codelibs.fess.crawler.processor;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.AccessResult;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.processor.impl.DefaultResponseProcessor;
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Thu Jul 17 08:28:31 GMT 2025
    - 3.7K bytes
    - Click Count (0)
  10. src/test/java/org/codelibs/fess/exec/CrawlerTest.java

            Crawler.Options options = new Crawler.Options();
            options.sessionId = "test-session";
            options.fileConfigIds = "file1";
    
            int result = crawler.doCrawl(options);
            assertEquals(Constants.EXIT_OK, result);
        }
    
        @Test
        public void test_doCrawl_withDataConfigIds() {
            Crawler.Options options = new Crawler.Options();
    Created: Tue Mar 31 13:07:34 GMT 2026
    - Last Modified: Fri Mar 13 23:01:26 GMT 2026
    - 30.8K bytes
    - Click Count (0)
Back to Top