- Sort Score
- Result 10 results
- Languages All
Results 1 - 7 of 7 for normalize_text (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
* PDF config file path. */ public static final String TIKA_PDF_CONFIG = "tika.pdf.config"; /** * A parameter key to normalize a text. */ public static final String NORMALIZE_TEXT = "normalize_text"; private static final String FILE_PASSWORD = "fess.file.password"; /** * Output encoding. */ protected String outputEncoding = Constants.UTF_8; /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java
if (configParam != null) { final String keepOriginalBody = configParam.get(Config.KEEP_ORIGINAL_BODY); if (StringUtil.isNotBlank(keepOriginalBody)) { params.put(TikaExtractor.NORMALIZE_TEXT, Constants.TRUE.equalsIgnoreCase(keepOriginalBody) ? Constants.FALSE : Constants.TRUE); } } return params; } /**
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TextUtil.java
* duplicate term removal, and custom space characters. * * <p>Example usage: * <pre>{@code * Reader reader = new StringReader("Example text to normalize."); * String normalizedText = TextUtil.normalizeText(reader) * .initialCapacity(5000) * .maxAlphanumTermSize(100) * .maxSymbolTermSize(50)
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/util/TextUtilTest.java
assertEquals("", normalizeText(" ", 100, -1, 2, false)); assertEquals("", normalizeText(" ", 100, -1, 2, false)); assertEquals("", normalizeText("\t", 100, -1, 2, false)); assertEquals("", normalizeText("\t\t", 100, -1, 2, false)); assertEquals("", normalizeText("\t \t", 100, -1, 2, false)); assertEquals("123 abc", normalizeText(" 123 abc ", 100, -1, 2, false));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 8.2K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/suggest/normalizer/ICUNormalizer.java
* the ICUNormalizer instance.</p> * * <p>Example usage:</p> * <pre> * ICUNormalizer normalizer = new ICUNormalizer("Any-Latin; NFD; [:Nonspacing Mark:] Remove; NFC"); * String normalizedText = normalizer.normalize("text to normalize", "field"); * </pre> * * @see com.ibm.icu.text.Transliterator */ public class ICUNormalizer implements Normalizer { /** The transliterator used for normalization. */
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Fri Jul 04 14:00:23 UTC 2025 - 1.9K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/suggest/normalizer/NormalizerChain.java
* * <p>Usage example:</p> * <pre> * NormalizerChain chain = new NormalizerChain(); * chain.add(new SomeNormalizer()); * chain.add(new AnotherNormalizer()); * String normalizedText = chain.normalize("input text", "field", "en"); * </pre> * * <p>Methods:</p> * <ul> * <li>{@link #normalize(String, String, String...)} - Applies all added normalizers to the input text.</li>
Registered: Fri Sep 19 09:08:11 UTC 2025 - Last Modified: Fri Jul 04 14:00:23 UTC 2025 - 2.2K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/DocumentHelper.java
return StringUtil.EMPTY; // empty } final int[] spaceChars = getSpaceChars(); try (final Reader reader = new StringReader(title)) { return TextUtil.normalizeText(reader).initialCapacity(title.length()).spaceChars(spaceChars).execute(); } catch (final IOException e) { return StringUtil.EMPTY; // empty } } /**
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 17.2K bytes - Viewed (0)