Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 28 for urlQueue (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/UrlQueue.java

     */
    package org.codelibs.fess.crawler.entity;
    
    /**
     * The UrlQueue interface represents a queue of URLs to be processed by a web crawler.
     * It provides methods to get and set various properties of a URL queue entry.
     *
     * @param <IDTYPE> the type of the identifier for the URL queue entry
     */
    public interface UrlQueue<IDTYPE> {
    
        /**
         * Retrieves the unique identifier of the URL queue.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/helper/CrawlerLogHelper.java

            if (objs.length > 1 && objs[1] instanceof final UrlQueue<?> urlQueue) {
                ComponentUtil.getCrawlerStatsHelper().begin(urlQueue);
            }
        }
    
        @Override
        protected void processCleanupCrawling(final Object... objs) {
            super.processCleanupCrawling(objs);
            if (objs.length > 1 && objs[1] instanceof final UrlQueue<?> urlQueue) {
                ComponentUtil.getCrawlerStatsHelper().done(urlQueue);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 8.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

         * @param objs the log objects (should contain UrlQueue and thread check count)
         */
        protected void processNoUrlInQueue(final Object... objs) {
            // CrawlerContext crawlerContext = (CrawlerContext) objs[0];
            final UrlQueue<?> urlQueue = (UrlQueue<?>) objs[1];
            final Integer threadCheckCount = (Integer) objs[2];
            if (logger.isDebugEnabled()) {
                if (urlQueue != null && urlQueue.getUrl() != null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                assertEquals(maxCount, dataService.getCount(sessionId2));
    
                UrlQueue urlQueue;
                while ((urlQueue = urlQueueService.poll(sessionId1)) != null) {
                    assertTrue(urlQueue.getUrl().startsWith(url1));
                }
                while ((urlQueue = urlQueueService.poll(sessionId2)) != null) {
                    assertTrue(urlQueue.getUrl().startsWith(url2));
                }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlQueueServiceImpl.java

            synchronized (urlQueueList) {
                final UrlQueueImpl<Long> urlQueue = new UrlQueueImpl<>();
                urlQueue.setSessionId(sessionId);
                urlQueue.setMethod(Constants.GET_METHOD);
                urlQueue.setUrl(url);
                urlQueue.setDepth(0);
                urlQueue.setCreateTime(SystemUtil.currentTimeMillis());
                urlQueueList.add(urlQueue);
            }
        }
    
        /*
         * (non-Javadoc)
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueServiceTest.java

            final OpenSearchUrlQueue urlQueue = new OpenSearchUrlQueue();
            urlQueue.setCreateTime(System.currentTimeMillis());
            urlQueue.setDepth(1);
            urlQueue.setMethod("GET");
            urlQueue.setSessionId("id1");
            urlQueue.setUrl("http://www.id1.com/");
    
            urlQueueService.insert(urlQueue);
    
            final OpenSearchUrlQueue urlQueue2 = new OpenSearchUrlQueue();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

         * Validates whether the URL queue entry is valid for crawling.
         * @param urlQueue The URL queue entry to validate.
         * @return true if valid, false otherwise.
         */
        protected boolean isValid(final UrlQueue<?> urlQueue) {
            if (urlQueue == null || StringUtil.isBlank(urlQueue.getUrl())
                    || crawlerContext.getMaxDepth() >= 0 && urlQueue.getDepth() > crawlerContext.getMaxDepth()) {
                return false;
            }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

                    if (logger.isDebugEnabled()) {
                        logger.debug("Canceled urlQueue: {}", urlQueue);
                    }
                    // cancel crawling
                    crawlerContext.decrementAndGetAccessCount();
                    final List<UrlQueue<?>> newUrlQueueList = new ArrayList<>();
                    newUrlQueueList.add(urlQueue);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

         * the URL queue for the current thread is removed.
         *
         * @param urlQueue the URL queue to be set for the current thread, or null to remove the URL queue
         */
        public static void setUrlQueue(final UrlQueue<?> urlQueue) {
            if (urlQueue == null) {
                URL_QUEUE_THREAD_LOCAL.remove();
            } else {
                URL_QUEUE_THREAD_LOCAL.set(urlQueue);
            }
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

         * URL tracking when certain HTTP status codes are encountered.
         *
         * @param urlQueue the URL queue item that was processed
         * @param responseData the response data from the crawl operation
         */
        @Override
        protected void processResponse(final UrlQueue<?> urlQueue, final ResponseData responseData) {
            super.processResponse(urlQueue, responseData);
    
            final FessConfig fessConfig = ComponentUtil.getFessConfig();
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 19.1K bytes
    - Viewed (0)
Back to top