- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 11 for locale (0.14 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
import java.io.PrintStream; import java.io.Reader; import java.io.Writer; import java.util.ArrayList; import java.util.Arrays; import java.util.Collections; import java.util.List; import java.util.Locale; import java.util.Map; import java.util.Properties; import java.util.concurrent.ConcurrentHashMap; import java.util.function.BiConsumer; import java.util.stream.Collectors;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler; import java.text.SimpleDateFormat; import java.util.Date; import java.util.Locale; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.client.CrawlerClientFactory;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 14K bytes - Viewed (0) -
README.md
crawler.urlFilter.addExclude(".*login.*"); ``` ## Supported Protocols and Formats ### Protocols - **HTTP/HTTPS**: Full web crawling support with cookies, authentication, redirects - **File System**: Local and network file system access - **FTP**: FTP server crawling with authentication - **SMB/CIFS**: Windows network shares - **Storage**: Cloud storage systems (MinIO, S3-compatible) ### Content Formats
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java
} /** * Gets the local IP address for passive mode FTP. * * @return The passive local host IP address */ public String getPassiveLocalHost() { return passiveLocalHost; } /** * Sets the local IP address for passive mode FTP. * * @param passiveLocalHost The passive local host IP address */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 39.5K bytes - Viewed (0) -
fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java
} } } /** * Polls the next URL queue entry for the specified session. * This method manages local caches and fetches from OpenSearch when needed. * * @param sessionId The session ID. * @return The next URL queue entry, or null if none available. */ @Override
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 17K bytes - Viewed (1) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java
import org.codelibs.fess.crawler.extractor.Extractor; import org.jodconverter.core.office.OfficeException; import org.jodconverter.core.office.OfficeManager; import org.jodconverter.local.LocalConverter; import jakarta.annotation.PostConstruct; import jakarta.annotation.PreDestroy; /** * Extracts text content from various document formats using JODConverter. */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java
urlFilter.processUrl("https://example.com/"); urlFilter.processUrl("http://test.com/path/to/page"); urlFilter.processUrl("ftp://files.server.com/documents/"); urlFilter.processUrl("file:///local/path/file.txt"); // Should complete without errors assertNotNull(urlFilter); } /** * Test processUrl with null URL */ public void test_processUrl_nullUrl() {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 19K bytes - Viewed (0) -
fess-crawler/pom.xml
<groupId>jp.gr.java_conf.dangan</groupId> <artifactId>jlha</artifactId> <version>${jlha.version}</version> </dependency> <dependency> <groupId>org.jodconverter</groupId> <artifactId>jodconverter-local</artifactId> <version>${jodconverter.version}</version> </dependency> <dependency> <groupId>com.sun.mail</groupId> <artifactId>jakarta.mail</artifactId> <version>${jakarta.mail.version}</version>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 11.3K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java
String[] emptyArray = crawlerContext.removeSitemaps(); assertNotNull(emptyArray); assertEquals(0, emptyArray.length); } /** * Test thread-local nature of sitemaps */ public void test_sitemaps_threadLocal() throws Exception { final String[] thread1Sitemaps = new String[] { "http://thread1.com/sitemap.xml" };
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/RuleManagerTest.java
Rule matchedRule2 = ruleManager.getRule(responseData2); assertEquals("pdfRule", matchedRule2.getRuleId()); ResponseData responseData3 = new ResponseData(); responseData3.setUrl("file:///local/file.txt"); Rule matchedRule3 = ruleManager.getRule(responseData3); assertNull(matchedRule3); // No match } /** * Test rule order preservation */
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 23.8K bytes - Viewed (0)