Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 21 for locale (0.09 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/EncodingHelper.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.helper;
    
    import java.util.HashMap;
    import java.util.Locale;
    import java.util.Map;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * EncodingHelper provides utility methods for managing and normalizing character encodings.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import java.io.PrintStream;
    import java.io.Reader;
    import java.io.Writer;
    import java.util.ArrayList;
    import java.util.Arrays;
    import java.util.Collections;
    import java.util.List;
    import java.util.Locale;
    import java.util.Map;
    import java.util.Properties;
    import java.util.concurrent.ConcurrentHashMap;
    import java.util.function.BiConsumer;
    import java.util.stream.Collectors;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

     */
    package org.codelibs.fess.crawler.helper;
    
    import java.io.BufferedReader;
    import java.io.InputStream;
    import java.io.InputStreamReader;
    import java.util.ArrayList;
    import java.util.List;
    import java.util.Locale;
    import java.util.regex.Matcher;
    import java.util.regex.Pattern;
    
    import org.apache.commons.io.input.BOMInputStream;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/Crawler.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler;
    
    import java.text.SimpleDateFormat;
    import java.util.Date;
    import java.util.Locale;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.client.CrawlerClientFactory;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

    import java.net.UnknownHostException;
    import java.text.ParseException;
    import java.text.SimpleDateFormat;
    import java.util.ArrayList;
    import java.util.Date;
    import java.util.HashMap;
    import java.util.List;
    import java.util.Locale;
    import java.util.Map;
    import java.util.concurrent.TimeUnit;
    import java.util.regex.Pattern;
    
    import javax.net.ssl.SSLContext;
    
    import org.apache.commons.io.output.DeferredFileOutputStream;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

        /**
         * Sets the current {@link CrawlerContext} for the current thread.
         * If the provided {@code crawlerContext} is {@code null}, the context is removed from the thread-local storage.
         * Otherwise, the provided {@code crawlerContext} is set in the thread-local storage.
         *
         * @param crawlerContext the {@link CrawlerContext} to be set for the current thread, or {@code null} to remove the context.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

        protected String contentXpath = "//BODY";
    
        /** Map of metadata field names to their corresponding XPath expressions. */
        protected Map<String, String> metadataXpathMap = new HashMap<>();
    
        /** Thread-local instance of XPathAPI for thread-safe XPath evaluation. */
        private final ThreadLocal<XPathAPI> xpathAPI = new ThreadLocal<>();
    
        /**
         * Creates a new HtmlExtractor instance.
         */
        public HtmlExtractor() {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  8. README.md

    crawler.urlFilter.addExclude(".*login.*");
    ```
    
    ## Supported Protocols and Formats
    
    ### Protocols
    - **HTTP/HTTPS**: Full web crawling support with cookies, authentication, redirects
    - **File System**: Local and network file system access
    - **FTP**: FTP server crawling with authentication
    - **SMB/CIFS**: Windows network shares
    - **Storage**: Cloud storage systems (MinIO, S3-compatible)
    
    ### Content Formats
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

            this.maxAccessCount = maxAccessCount;
        }
    
        /**
         * Adds sitemaps to the thread-local storage.
         * @param sitemaps An array of sitemap URLs.
         */
        public void addSitemaps(final String[] sitemaps) {
            sitemapsLocal.set(sitemaps);
        }
    
        /**
         * Removes sitemaps from the thread-local storage and returns them.
         * @return An array of sitemap URLs, or null if none were present.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

        }
    
        /**
         * Gets the local IP address for passive mode FTP.
         *
         * @return The passive local host IP address
         */
        public String getPassiveLocalHost() {
            return passiveLocalHost;
        }
    
        /**
         * Sets the local IP address for passive mode FTP.
         *
         * @param passiveLocalHost The passive local host IP address
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
Back to top