View Javadoc
1   package org.wikimedia.search.extra.analysis.homoglyph;
2   
3   import static java.util.Collections.singletonList;
4   
5   import java.util.List;
6   
7   import org.elasticsearch.index.analysis.PreConfiguredTokenFilter;
8   import org.elasticsearch.plugins.AnalysisPlugin;
9   import org.elasticsearch.plugins.Plugin;
10  
11  public class HomoglyphPlugin extends Plugin implements AnalysisPlugin {
12  
13      @Override
14      public List<PreConfiguredTokenFilter> getPreConfiguredTokenFilters() {
15          return singletonList(PreConfiguredTokenFilter.singleton("homoglyph_norm",
16                  true, in -> new HomoglyphTokenFilter(in, new TranslationTable(
17                          TranslationTableDictionaries.LATIN_REG, TranslationTableDictionaries.CYR_REG, TranslationTableDictionaries.LATIN_TO_CYRILLIC))));
18      }
19  }