Changeset 33634 for gs3-extensions/maori-lang-detection/src/org/greenstone/atea/TextLanguageDetector.java
- Timestamp: 2019-11-08T23:59:07+13:00 (4 years ago)
- File: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
gs3-extensions/maori-lang-detection/src/org/greenstone/atea/TextLanguageDetector.java
Columns: line number in r33633, line number in r33634, change marker (- removed, + added), line text.

r33633 r33634
   142    142    }
   143    143
   144         - /** inner class */
   145         - public class SentenceInfo {
   146         - public final double confidenceLevel;
   147         - /** 3 letter lang code */
   148         - public final String langCode;
   149         - public final String sentence;
   150         -
   151         - public SentenceInfo(double confidence, String langCode, String sentence) {
   152         - confidenceLevel = confidence;
   153         - this.langCode = langCode;
   154         - this.sentence = sentence;
   155         - }
   156         - }
   157         -
   158    144    /** TODO: Is it sensible to use the Maori Language Sentence Model to split the text
   159    145    * into sentences? What if the text in any other language or a mix of languages?
     …      …
   183    169    double confidence = bestLanguage.getConfidence();
   184    170
   185         - sentencesList.add(new SentenceInfo(confidence, bestLanguage, sentence));
          171  + sentencesList.add(new SentenceInfo(confidence, bestLanguage.getLang(), sentence));
   186    172    }
   187    173
     …      …
   207    193    separator = " ";
   208    194    }
   209         - sentence = sentence + separator + sentence[i];
          195  + sentence = sentence + separator + sentences[i];
   210    196
   211    197    //System.err.println(sentence);
     …      …
   214    200    double confidence = bestLanguage.getConfidence();
   215    201
   216         - sentencesList.add(new SentenceInfo(confidence, bestLanguage, sentence));
          202  + sentencesList.add(new SentenceInfo(confidence, bestLanguage.getLang(), sentence));
   217    203    }
   218    204
Note:
See TracChangeset
for help on using the changeset viewer.