Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 6 of 6 for Tokenizer (1.76 sec)

  1. src/main/resources/fess_indices/fess.json

    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Jun 06 14:17:42 UTC 2025
    - 39.8K bytes
    - Viewed (0)
  2. src/test/java/org/codelibs/fess/suggest/converter/AnalyzerConverterTest.java

                    .put("analysis.analyzer.test_reading_analyzer.tokenizer", "standard")
                    .put("analysis.analyzer.test_reading_term_analyzer.type", "custom")
                    .put("analysis.analyzer.test_reading_term_analyzer.tokenizer", "standard")
                    .put("analysis.analyzer.test_reading_analyzer_ja.type", "custom")
                    .put("analysis.analyzer.test_reading_analyzer_ja.tokenizer", "keyword")
    Registered: Sat Dec 20 13:04:59 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  3. README.md

    String escaped = JsonUtil.escape("Hello \"World\" with special chars");
    String unescaped = JsonUtil.unescape(escaped);
    
    // Text tokenization
    Tokenizer tokenizer = new Tokenizer("field1,field2,field3", ",");
    while (tokenizer.hasMoreTokens()) {
        String token = tokenizer.nextToken();
        // Process each token
    }
    
    // Decimal formatting
    DecimalFormat format = DecimalFormatUtil.getDecimalFormat("###,###.00");
    ```
    
    Registered: Sat Dec 20 08:55:33 UTC 2025
    - Last Modified: Sun Aug 31 02:56:02 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  4. src/test/java/org/codelibs/fess/suggest/analysis/SuggestAnalyzerTest.java

            List<AnalyzeToken> tokens = analyzer.analyzeAndReading(text, field, lang);
    
            assertNotNull(tokens);
            assertEquals(2, tokens.size()); // "Test123" and "ABC-456" (hyphen is not a split char in our tokenizer)
            assertEquals("Test123", tokens.get(0).getTerm());
            assertEquals("ABC-456", tokens.get(1).getTerm());
            assertEquals("TEST123", ((TestAnalyzeToken) tokens.get(0)).getReading());
    Registered: Sat Dec 20 13:04:59 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 15.7K bytes
    - Viewed (0)
  5. src/test/java/org/codelibs/opensearch/extension/analysis/NGramSynonymTokenizer.java

     */
    
    import java.io.IOException;
    import java.util.ArrayList;
    import java.util.Comparator;
    import java.util.List;
    import java.util.PriorityQueue;
    
    import org.apache.lucene.analysis.Tokenizer;
    import org.apache.lucene.analysis.synonym.SynonymMap;
    import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
    import org.apache.lucene.analysis.tokenattributes.OffsetAttribute;
    Registered: Sat Dec 20 13:04:59 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 17K bytes
    - Viewed (0)
  6. ADDING_NEW_LANGUAGE.md

          },
          "swedish_stemmer": {
            "type": "stemmer",
            "language": "swedish"
          }
        },
        "analyzer": {
          "sv_analyzer": {
            "type": "custom",
            "tokenizer": "standard",
            "filter": ["lowercase", "swedish_stop", "swedish_stemmer"]
          }
        }
      }
    }
    ```
    
    ### 2. Add Custom Dictionaries (Optional)
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Nov 06 11:36:30 UTC 2025
    - 10.4K bytes
    - Viewed (0)
Back to top