Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 15 for iterator (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.io.InputStream;
    import java.io.UnsupportedEncodingException;
    import java.util.ArrayList;
    import java.util.HashMap;
    import java.util.Iterator;
    import java.util.LinkedHashMap;
    import java.util.List;
    import java.util.Map;
    import java.util.concurrent.ExecutionException;
    import java.util.concurrent.TimeUnit;
    import java.util.regex.Matcher;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 23.9K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

                    }
                    throw new ExtractException("PDFBox process cannot finish in " + timeout + " sec.");
                }
                if (!exceptionSet.isEmpty()) {
                    throw exceptionSet.iterator().next();
                }
                writer.flush();
                final ExtractData extractData = new ExtractData(writer.toString());
                extractMetadata(document, extractData);
                return extractData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java

        }
    
        /**
         * Iterates through all access results for a session, calling the callback for each result.
         * Uses OpenSearch scroll API for efficient iteration over large result sets.
         *
         * @param sessionId The session ID.
         * @param callback The callback to execute for each access result.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 10.9K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/DataServiceImpl.java

            return dataHelper.getAccessResultList(url);
        }
    
        /**
         * Iterates over all access results for the specified session.
         *
         * @param sessionId the session ID
         * @param accessResultCallback the callback to invoke for each access result
         */
        @Override
        public void iterate(final String sessionId, final AccessResultCallback<AccessResultImpl<Long>> accessResultCallback) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.8K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb/SmbAuthenticationHolder.java

     * authentication based on a given path.
     *
     * <p>This class manages a collection of {@link SmbAuthentication} objects, each associated
     * with a specific path prefix. When a path is provided, it iterates through the stored
     * authentications to find the one whose path prefix matches the beginning of the given path.
     * This allows for different SMB shares to use different authentication credentials.</p>
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/AccessResultCallback.java

         */
        /**
         * Processes the given access result.
         *
         * @param accessResult the result of the access operation to be processed
         */
        void iterate(RESULT accessResult);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  7. README.md

    ```
    
    ## Data Access and Storage
    
    ### Accessing Crawled Data
    
    ```java
    // Get data service
    DataService dataService = container.getComponent("dataService");
    
    // Iterate through crawled data
    dataService.iterate(sessionId, accessResult -> {
        System.out.println("URL: " + accessResult.getUrl());
        System.out.println("Status: " + accessResult.getHttpStatusCode());
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
     * from each sitemap, and creates a new {@link RequestData} object for each URL.
     * These RequestData objects are added to a set of child URLs, which are then
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbAuthenticationHolder.java

     * authentication based on a given path.
     *
     * <p>This class manages a collection of {@link SmbAuthentication} objects, each associated
     * with a specific path prefix. When a path is provided, it iterates through the stored
     * authentications to find the one whose path prefix matches the beginning of the given path.
     * This allows for different SMB shares to use different authentication credentials.</p>
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.2K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                    assertTrue(urlQueue.getUrl() + "=>" + url2, urlQueue.getUrl().startsWith(url2));
                }
    
                dataService.iterate(sessionId1, accessResult -> assertTrue(accessResult.getUrl().startsWith(url1)));
                dataService.iterate(sessionId2, accessResult -> assertTrue(accessResult.getUrl().startsWith(url2)));
    
                dataService.delete(sessionId1);
                dataService.delete(sessionId2);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
Back to top