Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 26 for urlQueue (0.07 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueue.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    /**
     * @author shinsuke
     *
     */
    public interface UrlQueue<IDTYPE> {
    
        IDTYPE getId();
    
        void setId(IDTYPE id);
    
        String getSessionId();
    
        void setSessionId(String sessionId);
    
        String getMethod();
    
        void setMethod(String method);
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Mon Nov 04 07:44:18 UTC 2024
    - 1.4K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java

            if (objs.length > 1 && objs[1] instanceof final UrlQueue<?> urlQueue) {
                ComponentUtil.getCrawlerStatsHelper().begin(urlQueue);
            }
        }
    
        @Override
        protected void processCleanupCrawling(final Object... objs) {
            super.processCleanupCrawling(objs);
            if (objs.length > 1 && objs[1] instanceof final UrlQueue<?> urlQueue) {
                ComponentUtil.getCrawlerStatsHelper().done(urlQueue);
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Fri Oct 11 21:11:58 UTC 2024
    - 7.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

            final UrlQueue<?> urlQueue = (UrlQueue<?>) objs[1];
            final Throwable e = (Throwable) objs[2];
            logger.error("Crawling Exception at " + urlQueue.getUrl(), e);
        }
    
        protected void processCrawlingAccessException(final Object... objs) {
            // CrawlerContext crawlerContext = (CrawlerContext) objs[0];
            final UrlQueue<?> urlQueue = (UrlQueue<?>) objs[1];
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 10.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

            }
        }
    
        protected boolean isValid(final UrlQueue<?> urlQueue) {
            if (urlQueue == null || StringUtil.isBlank(urlQueue.getUrl())
                    || crawlerContext.getMaxDepth() >= 0 && urlQueue.getDepth() > crawlerContext.getMaxDepth()) {
                return false;
            }
    
            // url filter
            if (crawlerContext.urlFilter.match(urlQueue.getUrl())) {
                return true;
            }
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Sat Oct 12 01:41:37 UTC 2024
    - 15.5K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                assertEquals(maxCount, dataService.getCount(sessionId2));
    
                UrlQueue urlQueue;
                while ((urlQueue = urlQueueService.poll(sessionId1)) != null) {
                    assertTrue(urlQueue.getUrl().startsWith(url1));
                }
                while ((urlQueue = urlQueueService.poll(sessionId2)) != null) {
                    assertTrue(urlQueue.getUrl().startsWith(url2));
                }
    
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 18K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlQueueServiceImpl.java

                final UrlQueueImpl<Long> urlQueue = new UrlQueueImpl<>();
                urlQueue.setSessionId(sessionId);
                urlQueue.setMethod(Constants.GET_METHOD);
                urlQueue.setUrl(url);
                urlQueue.setUrl(url);
                urlQueue.setDepth(0);
                urlQueue.setCreateTime(SystemUtil.currentTimeMillis());
                urlQueueList.add(urlQueue);
            }
        }
    
        /*
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 7.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

                    if (logger.isDebugEnabled()) {
                        logger.debug("Canceled urlQueue: {}", urlQueue);
                    }
                    // cancel crawling
                    crawlerContext.decrementAndGetAccessCount();
                    final List<UrlQueue<?>> newUrlQueueList = new ArrayList<>();
                    newUrlQueueList.add(urlQueue);
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:47:32 UTC 2024
    - 9K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

        protected void storeChildUrlsToQueue(final UrlQueue<?> urlQueue, final Set<RequestData> childUrlSet) {
            if (childUrlSet != null) {
                // add an url
                try {
                    storeChildUrls(childUrlSet.stream().filter(rd -> StringUtil.isNotBlank(rd.getUrl())).collect(Collectors.toSet()),
                            urlQueue.getUrl(), urlQueue.getDepth() != null ? urlQueue.getDepth() + 1 : 1);
    Registered: Thu Oct 31 13:40:30 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 14.6K bytes
    - Viewed (0)
  9. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueServiceTest.java

            final OpenSearchUrlQueue urlQueue = new OpenSearchUrlQueue();
            urlQueue.setCreateTime(System.currentTimeMillis());
            urlQueue.setDepth(1);
            urlQueue.setMethod("GET");
            urlQueue.setSessionId("id1");
            urlQueue.setUrl("http://www.id1.com/");
    
            urlQueueService.insert(urlQueue);
    
            final OpenSearchUrlQueue urlQueue2 = new OpenSearchUrlQueue();
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 5.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

            if (urlQueue == null) {
                URL_QUEUE_THREAD_LOCAL.remove();
            } else {
                URL_QUEUE_THREAD_LOCAL.set(urlQueue);
            }
        }
    
        /**
         * Returns the value currently held by {@code ROBOT_CONTEXT_THREAD_LOCAL}.
         *
         * NOTE(review): the holder's declaration is not visible here; presumably it
         * is a {@code ThreadLocal<CrawlerContext>}, so the result would be specific
         * to the calling thread — confirm against the field declaration.
         *
         * @return the result of {@code ROBOT_CONTEXT_THREAD_LOCAL.get()}
         */
        public static CrawlerContext getCrawlerContext() {
            final CrawlerContext currentContext = ROBOT_CONTEXT_THREAD_LOCAL.get();
            return currentContext;
        }
    
        public static void setCrawlerContext(final CrawlerContext crawlerContext) {
            if (crawlerContext == null) {
    Registered: Sun Nov 10 03:50:12 UTC 2024
    - Last Modified: Thu Feb 22 01:36:27 UTC 2024
    - 2.9K bytes
    - Viewed (0)
Back to top