Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 9 of 9 for iterate (0.02 sec)

  1. README.md

    ```
    
    ## Data Access and Storage
    
    ### Accessing Crawled Data
    
    ```java
    // Get data service
    DataService dataService = container.getComponent("dataService");
    
    // Iterate through crawled data
    dataService.iterate(sessionId, accessResult -> {
        System.out.println("URL: " + accessResult.getUrl());
        System.out.println("Status: " + accessResult.getHttpStatusCode());
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/suggest/index/contents/document/ESSourceReader.java

    import org.opensearch.transport.client.Client;
    
    /**
     * <p>
     * {@link ESSourceReader} reads documents from Elasticsearch using the scroll API.
     * It implements the {@link DocumentReader} interface to provide a way to iterate over documents
     * in a large index without loading all of them into memory at once.
     * </p>
     *
     * <p>
     * The reader supports limiting the number of documents read based on a percentage of the total documents
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 11K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java

        }
    
        /**
         * Iterates through all access results for a session, calling the callback for each result.
         * Uses OpenSearch scroll API for efficient iteration over large result sets.
         *
         * @param sessionId The session ID.
         * @param callback The callback to execute for each access result.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 10.9K bytes
    - Viewed (0)
  4. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                    assertTrue(urlQueue.getUrl().startsWith(url2));
                }
    
                dataService.iterate(sessionId1, accessResult -> {
                    assertTrue(accessResult.getUrl().startsWith(url1));
                    assertEquals(Constants.GET_METHOD, accessResult.getMethod());
                });
                dataService.iterate(sessionId2, accessResult -> {
                    assertTrue(accessResult.getUrl().startsWith(url2));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                    assertTrue(urlQueue.getUrl().startsWith(url2));
                }
    
                dataService.iterate(sessionId1, accessResult -> {
                    assertTrue(accessResult.getUrl().startsWith(url1));
                    assertEquals(Constants.GET_METHOD, accessResult.getMethod());
                });
                dataService.iterate(sessionId2, accessResult -> {
                    assertTrue(accessResult.getUrl().startsWith(url2));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

         * @param sessionId The new session ID.
         */
        @Override
        public void generateUrlQueues(final String previousSessionId, final String sessionId) {
            dataService.iterate(previousSessionId, accessResult -> {
                final OpenSearchUrlQueue urlQueue = new OpenSearchUrlQueue();
                urlQueue.setSessionId(sessionId);
                urlQueue.setMethod(accessResult.getMethod());
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17K bytes
    - Viewed (1)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java

            assertEquals(content, new String(resultData.getData()));
            assertEquals(1, resultData.getChildUrlSet().size());
            assertEquals("http://hoge/test2.html", resultData.getChildUrlSet().iterator().next().getUrl());
        }
    
        public void test_transform_urllink() {
            String content = "<a href=\"http://fuga/test.html\">test</a>";
            final byte[] data = new String(content).getBytes();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.io.InputStream;
    import java.io.UnsupportedEncodingException;
    import java.util.ArrayList;
    import java.util.HashMap;
    import java.util.Iterator;
    import java.util.LinkedHashMap;
    import java.util.List;
    import java.util.Map;
    import java.util.concurrent.ExecutionException;
    import java.util.concurrent.TimeUnit;
    import java.util.regex.Matcher;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 23.9K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

                    }
                    throw new ExtractException("PDFBox process cannot finish in " + timeout + " sec.");
                }
                if (!exceptionSet.isEmpty()) {
                    throw exceptionSet.iterator().next();
                }
                writer.flush();
                final ExtractData extractData = new ExtractData(writer.toString());
                extractMetadata(document, extractData);
                return extractData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
Back to top