|
12 | 12 | import opennlp.tools.tokenize.TokenizerME; |
13 | 13 | import opennlp.tools.tokenize.TokenizerModel; |
14 | 14 | import opennlp.tools.util.Span; |
| 15 | +import org.apache.commons.lang.StringUtils; |
15 | 16 | import org.arabidopsis.ahocorasick.AhoCorasick; |
16 | 17 | import org.arabidopsis.ahocorasick.SearchResult; |
17 | 18 | import org.tartarus.snowball.SnowballStemmer; |
@@ -73,29 +74,29 @@ public DictionaryAnnotator(DictionaryStore _dictionary, String _stemmingLanguage |
73 | 74 | } |
74 | 75 |
|
75 | 76 | // if no stemming language is configured (null, empty or whitespace-only), fall back to "none" |
76 | | - if (stemmingLanguage == null || stemmingLanguage.isEmpty()) { |
77 | | - stemmingLanguage = "None"; |
| 77 | + if (StringUtils.isBlank(stemmingLanguage)) { |
| 78 | + stemmingLanguage = "none"; |
78 | 79 | } |
79 | 80 | // create a mapping between the language and the name of the class |
80 | 81 | // responsible for the stemming of the current language |
81 | 82 | languages = new HashMap<>(); |
82 | | - languages.put("None", ""); |
83 | | - languages.put("Danish", "danishStemmer"); |
84 | | - languages.put("Dutch", "dutchStemmer"); |
85 | | - languages.put("English", "englishStemmer"); |
86 | | - languages.put("Finnish", "finnishStemmer"); |
87 | | - languages.put("French", "frenchStemmer"); |
88 | | - languages.put("German", "germanStemmer"); |
89 | | - languages.put("Hungarian", "hungarianStemmer"); |
90 | | - languages.put("Italian", "italianStemmer"); |
91 | | - languages.put("Norwegian", "norwegianStemmer"); |
92 | | - //languages.put("english2", "porterStemmer"); |
93 | | - languages.put("Portuguese", "portugueseStemmer"); |
94 | | - languages.put("Romanian", "romanianStemmer"); |
95 | | - languages.put("Russian", "russianStemmer"); |
96 | | - languages.put("Spanish", "spanishStemmer"); |
97 | | - languages.put("Swedish", "swedishStemmer"); |
98 | | - languages.put("Turkish", "turkishStemmer"); |
| 83 | + languages.put("none", ""); |
| 84 | + languages.put("danish", "danishStemmer"); |
| 85 | + languages.put("dutch", "dutchStemmer"); |
| 86 | + languages.put("english", "englishStemmer"); |
| 87 | + languages.put("finnish", "finnishStemmer"); |
| 88 | + languages.put("french", "frenchStemmer"); |
| 89 | + languages.put("german", "germanStemmer"); |
| 90 | + languages.put("hungarian", "hungarianStemmer"); |
| 91 | + languages.put("italian", "italianStemmer"); |
| 92 | + languages.put("norwegian", "norwegianStemmer"); |
| 93 | + languages.put("english2", "porterStemmer"); |
| 94 | + languages.put("portuguese", "portugueseStemmer"); |
| 95 | + languages.put("romanian", "romanianStemmer"); |
| 96 | + languages.put("russian", "russianStemmer"); |
| 97 | + languages.put("spanish", "spanishStemmer"); |
| 98 | + languages.put("swedish", "swedishStemmer"); |
| 99 | + languages.put("turkish", "turkishStemmer"); |
99 | 100 |
|
100 | 101 | originalDictionary = new DictionaryStore(); |
101 | 102 | processedDictionary = new DictionaryStore(); |
|
0 commit comments