1 package org.wikimedia.search.extra.analysis.homoglyph;
2
3 import static java.util.Collections.singletonList;
4
5 import java.util.List;
6
7 import org.elasticsearch.index.analysis.PreConfiguredTokenFilter;
8 import org.elasticsearch.plugins.AnalysisPlugin;
9 import org.elasticsearch.plugins.Plugin;
10
11 public class HomoglyphPlugin extends Plugin implements AnalysisPlugin {
12
13 @Override
14 public List<PreConfiguredTokenFilter> getPreConfiguredTokenFilters() {
15 return singletonList(PreConfiguredTokenFilter.singleton("homoglyph_norm",
16 true, in -> new HomoglyphTokenFilter(in, new TranslationTable(
17 TranslationTableDictionaries.LATIN_REG, TranslationTableDictionaries.CYR_REG, TranslationTableDictionaries.LATIN_TO_CYRILLIC))));
18 }
19 }