Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 7 of 7 for normalize_text (0.08 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

         * PDF config file path.
         */
        public static final String TIKA_PDF_CONFIG = "tika.pdf.config";
    
        /**
         * A parameter key to normalize a text.
         */
        public static final String NORMALIZE_TEXT = "normalize_text";
    
        private static final String FILE_PASSWORD = "fess.file.password";
    
        /**
         * Output encoding.
         */
        protected String outputEncoding = Constants.UTF_8;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java

            if (configParam != null) {
                final String keepOriginalBody = configParam.get(Config.KEEP_ORIGINAL_BODY);
                if (StringUtil.isNotBlank(keepOriginalBody)) {
                    params.put(TikaExtractor.NORMALIZE_TEXT,
                            Constants.TRUE.equalsIgnoreCase(keepOriginalBody) ? Constants.FALSE : Constants.TRUE);
                }
            }
            return params;
        }
    
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TextUtil.java

     * duplicate term removal, and custom space characters.
     *
     * <p>Example usage:
     * <pre>{@code
     * Reader reader = new StringReader("Example text to normalize.");
     * String normalizedText = TextUtil.normalizeText(reader)
     *                                  .initialCapacity(5000)
     *                                  .maxAlphanumTermSize(100)
     *                                  .maxSymbolTermSize(50)
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/TextUtilTest.java

            assertEquals("", normalizeText(" ", 100, -1, 2, false));
            assertEquals("", normalizeText("  ", 100, -1, 2, false));
            assertEquals("", normalizeText("\t", 100, -1, 2, false));
            assertEquals("", normalizeText("\t\t", 100, -1, 2, false));
            assertEquals("", normalizeText("\t \t", 100, -1, 2, false));
            assertEquals("123 abc", normalizeText(" 123 abc ", 100, -1, 2, false));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 8.2K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/suggest/normalizer/ICUNormalizer.java

     * the ICUNormalizer instance.</p>
     *
     * <p>Example usage:</p>
     * <pre>
     * ICUNormalizer normalizer = new ICUNormalizer("Any-Latin; NFD; [:Nonspacing Mark:] Remove; NFC");
     * String normalizedText = normalizer.normalize("text to normalize", "field");
     * </pre>
     *
     * @see com.ibm.icu.text.Transliterator
     */
    public class ICUNormalizer implements Normalizer {
        /** The transliterator used for normalization. */
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/suggest/normalizer/NormalizerChain.java

     *
     * <p>Usage example:</p>
     * <pre>
     * NormalizerChain chain = new NormalizerChain();
     * chain.add(new SomeNormalizer());
     * chain.add(new AnotherNormalizer());
     * String normalizedText = chain.normalize("input text", "field", "en");
     * </pre>
     *
     * <p>Methods:</p>
     * <ul>
     *   <li>{@link #normalize(String, String, String...)} - Applies all added normalizers to the input text.</li>
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 2.2K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/helper/DocumentHelper.java

                return StringUtil.EMPTY; // empty
            }
    
            final int[] spaceChars = getSpaceChars();
            try (final Reader reader = new StringReader(title)) {
                return TextUtil.normalizeText(reader).initialCapacity(title.length()).spaceChars(spaceChars).execute();
            } catch (final IOException e) {
                return StringUtil.EMPTY; // empty
            }
        }
    
        /**
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 17.2K bytes
    - Viewed (0)
Back to top