Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 53 for character (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CharUtil.java

    package org.codelibs.fess.crawler.util;
    
    /**
     * Utility class for character-related operations.
     */
    public final class CharUtil {
        /**
         * Private constructor to prevent instantiation of this utility class.
         * It takes no arguments and performs no work.
         */
        private CharUtil() {
            // Intentionally empty.
        }
    
        /**
         * Checks if the given character is a valid URL character.
         *
         * Valid URL characters include:
         * - Lowercase letters (a-z)
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 22 13:28:22 UTC 2025
    - 1.8K bytes
    - Viewed (1)
  2. src/main/java/org/codelibs/fess/dict/mapping/CharMappingItem.java

    /**
     * Represents a single character mapping rule that defines how input characters are mapped to output characters
     * for text analysis and search processing. This class is used in character mapping dictionaries to transform
     * text during indexing and search operations.
     *
     * <p>Each mapping item consists of one or more input character sequences that are mapped to a single output
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Nov 20 07:09:00 UTC 2025
    - 7.9K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/dict/mapping/CharMappingFile.java

    import org.dbflute.optional.OptionalEntity;
    
    /**
     * Character mapping file handler for managing character mapping dictionaries.
     * This class provides functionality to load, parse, and manage character mapping
     * rules that define how input characters should be transformed to output characters
     * during text analysis and search processing.
     *
     * Character mapping files contain mapping rules in the format:
     * input1,input2,... => output
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 20 05:56:45 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/core/lang/StringUtil.java

            if (chars.length >= 2 && Character.isUpperCase(chars[0]) && Character.isUpperCase(chars[1])) {
                return name;
            }
            chars[0] = Character.toLowerCase(chars[0]);
            return new String(chars);
        }
    
        /**
         * Capitalizes a string according to JavaBeans conventions.
         * Note: If the first two characters are uppercase, the string will not be capitalized.
         * <p>
    Registered: Sat Dec 20 08:55:33 UTC 2025
    - Last Modified: Sat Nov 22 11:21:59 UTC 2025
    - 21.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CsvExtractor.java

                throw new ExtractException("Failed to parse CSV content", e);
            }
        }
    
        /**
         * Detects the delimiter character from a CSV line.
         *
         * @param line the CSV line to analyze
         * @return the detected delimiter character
         */
        protected Character detectDelimiter(final String line) {
            final char[] candidates = { ',', '\t', ';', '|' };
            int maxCount = 0;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CharUtilTest.java

            for (char c : validChars.toCharArray()) {
                assertTrue("Character '" + c + "' should be a valid URL character", CharUtil.isUrlChar(c));
            }
        }
    
        public void test_isUrlChar_boundaryChars() {
            // Test boundary characters for ranges
            assertTrue(CharUtil.isUrlChar('a')); // first lowercase
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 5.6K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

     *       to extract child URLs.</li>
     *   <li><b>defaultEncoding:</b> The default character encoding to use if none is
     *       specified in the HTML content.</li>
     *   <li><b>preloadSizeForCharset:</b> The number of bytes to read from the input
     *       stream to determine the character set encoding.</li>
     *   <li><b>invalidUrlPattern:</b> A regular expression pattern used to identify
     *       invalid URLs.</li>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 29 07:42:33 UTC 2025
    - 30.5K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

        }
    
        /**
         * Determines the character set for the given file.
         * Currently returns the default charset configured for this client.
         *
         * @param file The file to determine the charset for; this implementation does not read it
         * @return The character set name
         */
        protected String getCharSet(final File file) {
            // No per-file detection: the same charset value is returned whatever file is passed.
            return charset;
        }
    
        /**
         * Gets the character encoding used for FTP operations.
         *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 40K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java

        }
    
        /**
         * Gets the character set for the given file.
         * This implementation returns {@code charset} as-is and does not inspect the file.
         *
         * @param file the file to get the character set for (not consulted by this implementation)
         * @return the character set
         */
        protected String getCharSet(final File file) {
            // The file argument is unused here; the result is the same for every file.
            return charset;
        }
    
        /**
         * Gets the character encoding used for files.
         *
         * @return the character encoding
         */
        public String getCharset() {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 15.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

        }
    
        /**
         * Strips invalid XML characters from the input string.
         *
         * This method removes characters that are not allowed in XML documents
         * according to the XML 1.0 specification. Valid characters include:
         * - Tab (0x9)
         * - Line feed (0xA)
         * - Carriage return (0xD)
         * - Any character between 0x20 and 0xD7FF
         * - Any character between 0xE000 and 0xFFFD
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 22 13:28:22 UTC 2025
    - 9.5K bytes
    - Viewed (0)
Back to top