- Sort Score
- Result 10 results
- Languages All
Results 1 - 5 of 5 for normalize_text (0.2 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
public static final String TIKA_TESSERACT_CONFIG = "tika.tesseract.config"; public static final String TIKA_PDF_CONFIG = "tika.pdf.config"; public static final String NORMALIZE_TEXT = "normalize_text"; private static final String FILE_PASSWORD = "fess.file.password"; protected String outputEncoding = Constants.UTF_8; protected boolean readAsTextIfFailed = false;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:41:37 UTC 2024 - 25K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/crawler/transformer/AbstractFessFileTransformer.java
if (configParam != null) { final String keepOriginalBody = configParam.get(Config.KEEP_ORIGINAL_BODY); if (StringUtil.isNotBlank(keepOriginalBody)) { params.put(TikaExtractor.NORMALIZE_TEXT, Constants.TRUE.equalsIgnoreCase(keepOriginalBody) ? Constants.FALSE : Constants.TRUE); } } return params; }
Registered: Thu Oct 31 13:40:30 UTC 2024 - Last Modified: Fri Oct 11 21:11:58 UTC 2024 - 23.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/util/TextUtilTest.java
assertEquals("", normalizeText(" ", 100, -1, 2, false)); assertEquals("", normalizeText(" ", 100, -1, 2, false)); assertEquals("", normalizeText("\t", 100, -1, 2, false)); assertEquals("", normalizeText("\t\t", 100, -1, 2, false)); assertEquals("", normalizeText("\t \t", 100, -1, 2, false)); assertEquals("123 abc", normalizeText(" 123 abc ", 100, -1, 2, false));
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Thu Feb 22 01:36:27 UTC 2024 - 8.2K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/DocumentHelper.java
return StringUtil.EMPTY; // empty } final int[] spaceChars = getSpaceChars(); try (final Reader reader = new StringReader(title)) { return TextUtil.normalizeText(reader).initialCapacity(title.length()).spaceChars(spaceChars).execute(); } catch (final IOException e) { return StringUtil.EMPTY; // empty } }
Registered: Thu Oct 31 13:40:30 UTC 2024 - Last Modified: Thu Feb 22 01:53:18 UTC 2024 - 12K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TextUtil.java
public TextNormalizeContext spaceChars(final int[] spaceChars) { this.spaceChars = spaceChars; return this; } } public static TextNormalizeContext normalizeText(final Reader reader) { return new TextNormalizeContext(reader); } private static boolean isLastSpaceChar(final StringBuilder buf) { if (buf.length() == 0) { return false;
Registered: Sun Nov 10 03:50:12 UTC 2024 - Last Modified: Sat Oct 12 01:40:57 UTC 2024 - 7.9K bytes - Viewed (0)