- Sort Score
- Result 10 results
- Languages All
Results 1 - 9 of 9 for iterate (0.02 sec)
-
README.md
``` ## Data Access and Storage ### Accessing Crawled Data ```java // Get data service DataService dataService = container.getComponent("dataService"); // Iterate through crawled data dataService.iterate(sessionId, accessResult -> { System.out.println("URL: " + accessResult.getUrl()); System.out.println("Status: " + accessResult.getHttpStatusCode());
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/suggest/index/contents/document/ESSourceReader.java
import org.opensearch.transport.client.Client; /** * <p> * {@link ESSourceReader} reads documents from Elasticsearch using the scroll API. * It implements the {@link DocumentReader} interface to provide a way to iterate over documents * in a large index without loading all of them into memory at once. * </p> * * <p> * The reader supports limiting the number of documents read based on a percentage of the total documents
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Thu Aug 07 02:41:28 UTC 2025 - 11K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchDataService.java
} /** * Iterates through all access results for a session, calling the callback for each result. * Uses OpenSearch scroll API for efficient iteration over large result sets. * * @param sessionId The session ID. * @param callback The callback to execute for each access result. */ @Override
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 10.9K bytes - Viewed (0) -
fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
assertTrue(urlQueue.getUrl().startsWith(url2)); } dataService.iterate(sessionId1, accessResult -> { assertTrue(accessResult.getUrl().startsWith(url1)); assertEquals(Constants.GET_METHOD, accessResult.getMethod()); }); dataService.iterate(sessionId2, accessResult -> { assertTrue(accessResult.getUrl().startsWith(url2));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 12.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
assertTrue(urlQueue.getUrl().startsWith(url2)); } dataService.iterate(sessionId1, accessResult -> { assertTrue(accessResult.getUrl().startsWith(url1)); assertEquals(Constants.GET_METHOD, accessResult.getMethod()); }); dataService.iterate(sessionId2, accessResult -> { assertTrue(accessResult.getUrl().startsWith(url2));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java
* @param sessionId The new session ID. */ @Override public void generateUrlQueues(final String previousSessionId, final String sessionId) { dataService.iterate(previousSessionId, accessResult -> { final OpenSearchUrlQueue urlQueue = new OpenSearchUrlQueue(); urlQueue.setSessionId(sessionId); urlQueue.setMethod(accessResult.getMethod());
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 17K bytes - Viewed (1) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java
assertEquals(content, new String(resultData.getData())); assertEquals(1, resultData.getChildUrlSet().size()); assertEquals("http://hoge/test2.html", resultData.getChildUrlSet().iterator().next().getUrl()); } public void test_transform_urllink() { String content = "<a href=\"http://fuga/test.html\">test</a>"; final byte[] data = new String(content).getBytes();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 13.8K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java
*/ package org.codelibs.fess.crawler.transformer.impl; import java.io.InputStream; import java.io.UnsupportedEncodingException; import java.util.ArrayList; import java.util.HashMap; import java.util.Iterator; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; import java.util.concurrent.ExecutionException; import java.util.concurrent.TimeUnit; import java.util.regex.Matcher;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 23.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java
} throw new ExtractException("PDFBox process cannot finish in " + timeout + " sec."); } if (!exceptionSet.isEmpty()) { throw exceptionSet.iterator().next(); } writer.flush(); final ExtractData extractData = new ExtractData(writer.toString()); extractMetadata(document, extractData); return extractData;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12.7K bytes - Viewed (0)