Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 26 for FFiles (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java

                    final Set<RequestData> requestDataSet = new HashSet<>();
                    if (includeContent) {
                        final File[] files = file.listFiles();
                        if (files != null) {
                            for (final File f : files) {
                                final String childUri = f.toURI().toASCIIString();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/smb/SmbClientTest.java

            Files.createDirectory(testuser2Dir);
    
            Files.writeString(usersDir.resolve("file1.txt"), "file1");
            Path dir1 = usersDir.resolve("dir1");
            Files.createDirectory(dir1);
            Files.writeString(dir1.resolve("file2.txt"), "file2");
            Path dir2 = dir1.resolve("dir2");
            Files.createDirectory(dir2);
            Files.writeString(dir2.resolve("file3.txt"), "file3");
            Path dir3 = usersDir.resolve("dir3");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 13.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/FileTransformer.java

            }
            return new File(baseDir, filePath);
        }
    
        /**
         * Gets the base path for storing files.
         *
         * @return the base path
         */
        public String getPath() {
            return path;
        }
    
        /**
         * Sets the base path for storing files.
         *
         * @param path the base path to set
         */
        public void setPath(final String path) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PasswordBasedExtractor.java

         */
        public PasswordBasedExtractor() {
            super();
        }
    
        /**
         * Adds a password for files matching the given regular expression pattern.
         * @param regex the regular expression pattern to match against URLs or resource names
         * @param password the password to use for matching files
         */
        public void addPassword(final String regex, final String password) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  5. README.md

    #### Archives and Compressed Files
    - ZIP, TAR, GZ archives
    - LHA compression format
    - Nested archive extraction
    
    #### Web and Markup
    - HTML, XHTML with XPath support
    - XML documents
    - JSON and structured data
    
    #### Media Files
    - Audio formats (MP3, WAV, FLAC)
    - Video formats (MP4, AVI, MOV)
    - Metadata extraction from media files
    
    ## Architecture
    
    ### Multi-Module Structure
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbClient.java

                    }
                    final Set<RequestData> requestDataSet = new HashSet<>(100);
                    if (includeContent) {
                        final SmbFile[] files = file.listFiles();
                        if (files != null) {
                            for (final SmbFile f : files) {
                                final String chileUri = f.toString();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 23K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

    import jp.gr.java_conf.dangan.util.lha.LhaFile;
    import jp.gr.java_conf.dangan.util.lha.LhaHeader;
    
    /**
     * Extractor implementation for LHA (LZH) archive files.
     * This extractor can extract text content from files within LHA archives
     * by using appropriate extractors for each contained file type.
     *
     * @author shinsuke
     */
    public class LhaExtractor extends AbstractExtractor {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            // Without any patterns, all URLs should match
            assertTrue(urlFilter.match("https://example.com/"));
            assertTrue(urlFilter.match("https://test.com/page"));
            assertTrue(urlFilter.match("ftp://files.com/document.pdf"));
            assertTrue(urlFilter.match("file:///home/user/file.txt"));
        }
    
        /**
         * Test match with complex URL patterns
         */
        public void test_match_complexUrls() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb/SmbClient.java

                    }
                    final Set<RequestData> requestDataSet = new HashSet<>(100);
                    if (includeContent) {
                        final SmbFile[] files = file.listFiles();
                        if (files != null) {
                            for (final SmbFile f : files) {
                                final String childUri = f.getURL().toExternalForm();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 22.5K bytes
    - Viewed (3)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

    /**
     * PdfExtractor extracts text content from PDF files using Apache PDFBox.
     * It supports password-protected PDFs and can extract embedded documents and annotations.
     *
     * <p>The extractor runs text extraction in a separate thread with a configurable timeout
     * to prevent hanging on problematic PDF files. It also extracts metadata from the PDF
     * document and includes it in the extraction result.
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
Back to top