Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 11 for locale (0.14 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import java.io.PrintStream;
    import java.io.Reader;
    import java.io.Writer;
    import java.util.ArrayList;
    import java.util.Arrays;
    import java.util.Collections;
    import java.util.List;
    import java.util.Locale;
    import java.util.Map;
    import java.util.Properties;
    import java.util.concurrent.ConcurrentHashMap;
    import java.util.function.BiConsumer;
    import java.util.stream.Collectors;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler;
    
    import java.text.SimpleDateFormat;
    import java.util.Date;
    import java.util.Locale;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  3. README.md

    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    ### Protocols
    - **HTTP/HTTPS**: Full web crawling support with cookies, authentication, redirects
    - **File System**: Local and network file system access
    - **FTP**: FTP server crawling with authentication
    - **SMB/CIFS**: Windows network shares
    - **Storage**: Cloud storage systems (MinIO, S3-compatible)
    
    ### Content Formats
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

        }
    
        /**
         * Gets the local IP address for passive mode FTP.
         *
         * @return The passive local host IP address
         */
        public String getPassiveLocalHost() {
            return passiveLocalHost;
        }
    
        /**
         * Sets the local IP address for passive mode FTP.
         *
         * @param passiveLocalHost The passive local host IP address
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

                }
            }
        }
    
        /**
         * Polls the next URL queue entry for the specified session.
         * This method manages local caches and fetches from OpenSearch when needed.
         *
         * @param sessionId The session ID.
         * @return The next URL queue entry, or null if none available.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17K bytes
    - Viewed (1)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.jodconverter.core.office.OfficeException;
    import org.jodconverter.core.office.OfficeManager;
    import org.jodconverter.local.LocalConverter;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
     * Extracts text content from various document formats using JODConverter.
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            urlFilter.processUrl("https://example.com/");
            urlFilter.processUrl("http://test.com/path/to/page");
            urlFilter.processUrl("ftp://files.server.com/documents/");
            urlFilter.processUrl("file:///local/path/file.txt");
    
            // Should complete without errors
            assertNotNull(urlFilter);
        }
    
        /**
         * Test processUrl with null URL
         */
        public void test_processUrl_nullUrl() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  8. fess-crawler/pom.xml

    			<groupId>jp.gr.java_conf.dangan</groupId>
    			<artifactId>jlha</artifactId>
    			<version>${jlha.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.jodconverter</groupId>
    			<artifactId>jodconverter-local</artifactId>
    			<version>${jodconverter.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>com.sun.mail</groupId>
    			<artifactId>jakarta.mail</artifactId>
    			<version>${jakarta.mail.version}</version>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.3K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            String[] emptyArray = crawlerContext.removeSitemaps();
            assertNotNull(emptyArray);
            assertEquals(0, emptyArray.length);
        }
    
        /**
         * Test thread-local nature of sitemaps
         */
        public void test_sitemaps_threadLocal() throws Exception {
            final String[] thread1Sitemaps = new String[] { "http://thread1.com/sitemap.xml" };
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/RuleManagerTest.java

            Rule matchedRule2 = ruleManager.getRule(responseData2);
            assertEquals("pdfRule", matchedRule2.getRuleId());
    
            ResponseData responseData3 = new ResponseData();
            responseData3.setUrl("file:///local/file.txt");
            Rule matchedRule3 = ruleManager.getRule(responseData3);
            assertNull(matchedRule3); // No match
        }
    
        /**
         * Test rule order preservation
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 23.8K bytes
    - Viewed (0)
Back to top