- Sort Score
- Result 10 results
- Languages All
Results 1 - 4 of 4 for normalize_text (0.14 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
* PDF config file path. */ public static final String TIKA_PDF_CONFIG = "tika.pdf.config"; /** * A parameter key to normalize a text. */ public static final String NORMALIZE_TEXT = "normalize_text"; private static final String FILE_PASSWORD = "fess.file.password"; /** * Output encoding. */ protected String outputEncoding = Constants.UTF_8; /**
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java
if (configParam != null) { final String keepOriginalBody = configParam.get(Config.KEEP_ORIGINAL_BODY); if (StringUtil.isNotBlank(keepOriginalBody)) { params.put(TikaExtractor.NORMALIZE_TEXT, Constants.TRUE.equalsIgnoreCase(keepOriginalBody) ? Constants.FALSE : Constants.TRUE); } } return params; } /**
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 25.6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TextUtil.java
* duplicate term removal, and custom space characters. * * <p>Example usage: * <pre>{@code * Reader reader = new StringReader("Example text to normalize."); * String normalizedText = TextUtil.normalizeText(reader) * .initialCapacity(5000) * .maxAlphanumTermSize(100) * .maxSymbolTermSize(50)
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 12K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/DocumentHelper.java
return StringUtil.EMPTY; // empty } final int[] spaceChars = getSpaceChars(); try (final Reader reader = new StringReader(title)) { return TextUtil.normalizeText(reader).initialCapacity(title.length()).spaceChars(spaceChars).execute(); } catch (final IOException e) { return StringUtil.EMPTY; // empty } } /**
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Aug 07 03:06:29 UTC 2025 - 17.2K bytes - Viewed (0)