- Sort Score
- Result 10 results
- Languages All
Results 1 - 10 of 26 for FFiles (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java
final Set<RequestData> requestDataSet = new HashSet<>(); if (includeContent) { final File[] files = file.listFiles(); if (files != null) { for (final File f : files) { final String childUri = f.toURI().toASCIIString();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 13.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb/SmbClientTest.java
Files.createDirectory(testuser2Dir); Files.writeString(usersDir.resolve("file1.txt"), "file1"); Path dir1 = usersDir.resolve("dir1"); Files.createDirectory(dir1); Files.writeString(dir1.resolve("file2.txt"), "file2"); Path dir2 = dir1.resolve("dir2"); Files.createDirectory(dir2); Files.writeString(dir2.resolve("file3.txt"), "file3"); Path dir3 = usersDir.resolve("dir3");
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 13.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/FileTransformer.java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 11.7K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PasswordBasedExtractor.java
*/ public PasswordBasedExtractor() { super(); } /** * Adds a password for files matching the given regular expression pattern. * @param regex the regular expression pattern to match against URLs or resource names * @param password the password to use for matching files */ public void addPassword(final String regex, final String password) {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 5.1K bytes - Viewed (0) -
README.md
#### Archives and Compressed Files - ZIP, TAR, GZ archives - LHA compression format - Nested archive extraction #### Web and Markup - HTML, XHTML with XPath support - XML documents - JSON and structured data #### Media Files - Audio formats (MP3, WAV, FLAC) - Video formats (MP4, AVI, MOV) - Metadata extraction from media files ## Architecture ### Multi-Module Structure
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Aug 31 05:32:52 UTC 2025 - 15.3K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbClient.java
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Sep 18 09:30:45 UTC 2025 - 23K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java
import jp.gr.java_conf.dangan.util.lha.LhaFile; import jp.gr.java_conf.dangan.util.lha.LhaHeader; /** * Extractor implementation for LHA (LZH) archive files. * This extractor can extract text content from files within LHA archives * by using appropriate extractors for each contained file type. * * @author shinsuke */ public class LhaExtractor extends AbstractExtractor {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 5.8K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java
// Without any patterns, all URLs should match assertTrue(urlFilter.match("https://example.com/")); assertTrue(urlFilter.match("https://test.com/page")); assertTrue(urlFilter.match("ftp://files.com/document.pdf")); assertTrue(urlFilter.match("file:///home/user/file.txt")); } /** * Test match with complex URL patterns */ public void test_match_complexUrls() {
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 19K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb/SmbClient.java
} final Set<RequestData> requestDataSet = new HashSet<>(100); if (includeContent) { final SmbFile[] files = file.listFiles(); if (files != null) { for (final SmbFile f : files) { final String childUri = f.getURL().toExternalForm();
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Sep 18 09:30:45 UTC 2025 - 22.5K bytes - Viewed (3) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java
/** * PdfExtractor extracts text content from PDF files using Apache PDFBox. * It supports password-protected PDFs and can extract embedded documents and annotations. * * <p>The extractor runs text extraction in a separate thread with a configurable timeout * to prevent hanging on problematic PDF files. It also extracts metadata from the PDF * document and includes it in the extraction result. *
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12.7K bytes - Viewed (0)