Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 16 for LOCAL (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

        /**
         * Sets the current {@link CrawlerContext} for the current thread.
         * If the provided {@code crawlerContext} is {@code null}, the context is removed from the thread-local storage.
         * Otherwise, the provided {@code crawlerContext} is set in the thread-local storage.
         *
         * @param crawlerContext the {@link CrawlerContext} to be set for the current thread, or {@code null} to remove the context.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

            this.maxAccessCount = maxAccessCount;
        }
    
        /**
         * Adds sitemaps to the thread-local storage.
         * @param sitemaps An array of sitemap URLs.
         */
        public void addSitemaps(final String[] sitemaps) {
            sitemapsLocal.set(sitemaps);
        }
    
        /**
         * Removes sitemaps from the thread-local storage and returns them.
         * @return An array of sitemap URLs, or null if none were present.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

        }
    
        /**
         * Gets the local IP address for passive mode FTP.
         *
         * @return The passive local host IP address
         */
        public String getPassiveLocalHost() {
            return passiveLocalHost;
        }
    
        /**
         * Sets the local IP address for passive mode FTP.
         *
         * @param passiveLocalHost The passive local host IP address
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

        protected String contentXpath = "//BODY";
    
        /** Map of metadata field names to their corresponding XPath expressions. */
        protected Map<String, String> metadataXpathMap = new HashMap<>();
    
        /** Thread-local instance of XPathAPI for thread-safe XPath evaluation. */
        private final ThreadLocal<XPathAPI> xpathAPI = new ThreadLocal<>();
    
        /**
         * Creates a new HtmlExtractor instance.
         */
        public HtmlExtractor() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

                }
            }
        }
    
        /**
         * Polls the next URL queue entry for the specified session.
         * This method manages local caches and fetches from OpenSearch when needed.
         *
         * @param sessionId The session ID.
         * @return The next URL queue entry, or null if none available.
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17K bytes
    - Viewed (1)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.jodconverter.core.office.OfficeException;
    import org.jodconverter.core.office.OfficeManager;
    import org.jodconverter.local.LocalConverter;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
     * Extracts text content from various document formats using JODConverter.
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  7. README.md

    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    ### Protocols
    - **HTTP/HTTPS**: Full web crawling support with cookies, authentication, redirects
    - **File System**: Local and network file system access
    - **FTP**: FTP server crawling with authentication
    - **SMB/CIFS**: Windows network shares
    - **Storage**: Cloud storage systems (MinIO, S3-compatible)
    
    ### Content Formats
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            urlFilter.processUrl("https://example.com/");
            urlFilter.processUrl("http://test.com/path/to/page");
            urlFilter.processUrl("ftp://files.server.com/documents/");
            urlFilter.processUrl("file:///local/path/file.txt");
    
            // Should complete without errors
            assertNotNull(urlFilter);
        }
    
        /**
         * Test processUrl with null URL
         */
        public void test_processUrl_nullUrl() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  9. fess-crawler/pom.xml

    			<groupId>jp.gr.java_conf.dangan</groupId>
    			<artifactId>jlha</artifactId>
    			<version>${jlha.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.jodconverter</groupId>
    			<artifactId>jodconverter-local</artifactId>
    			<version>${jodconverter.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>com.sun.mail</groupId>
    			<artifactId>jakarta.mail</artifactId>
    			<version>${jakarta.mail.version}</version>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.3K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/JodExtractorTest.java

    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.dbflute.utflute.core.PlainTestCase;
    import org.jodconverter.local.office.LocalOfficeManager;
    
    /**
     * @author shinsuke
     *
     */
    public class JodExtractorTest extends PlainTestCase {
        private static final Logger logger = LogManager.getLogger(JodExtractorTest.class);
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.5K bytes
    - Viewed (0)
Back to top