Skip to content

Commit ec897ae

Browse files
committed
Fix random detection results in low accuracy mode
1 parent de8fb0b commit ec897ae

File tree

1 file changed

+4
-13
lines changed

1 file changed

+4
-13
lines changed

src/detector.rs

Lines changed: 4 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -136,11 +136,8 @@ impl LanguageDetector {
136136
detector.preload_language_models(&languages);
137137
}
138138

139-
if is_built_from_one_language || is_low_accuracy_mode_enabled {
140-
detector.preload_unique_ngram_models();
141-
}
142-
143139
if is_built_from_one_language {
140+
detector.preload_unique_ngram_models();
144141
detector.preload_most_common_ngram_models();
145142
}
146143

@@ -267,15 +264,12 @@ impl LanguageDetector {
267264
self.fivegram_language_models.remove(language);
268265
}
269266

270-
if self.is_built_from_one_language || self.is_low_accuracy_mode_enabled {
267+
if self.is_built_from_one_language {
271268
self.unigram_language_models.remove(language);
272269
self.unique_bigram_language_models.remove(language);
273270
self.unique_trigram_language_models.remove(language);
274271
self.unique_quadrigram_language_models.remove(language);
275272
self.unique_fivegram_language_models.remove(language);
276-
}
277-
278-
if self.is_built_from_one_language {
279273
self.most_common_unigram_language_models.remove(language);
280274
self.most_common_bigram_language_models.remove(language);
281275
self.most_common_trigram_language_models.remove(language);
@@ -293,15 +287,12 @@ impl LanguageDetector {
293287
self.fivegram_language_models.shrink_to_fit();
294288
}
295289

296-
if self.is_built_from_one_language || self.is_low_accuracy_mode_enabled {
290+
if self.is_built_from_one_language {
297291
self.unigram_language_models.shrink_to_fit();
298292
self.unique_bigram_language_models.shrink_to_fit();
299293
self.unique_trigram_language_models.shrink_to_fit();
300294
self.unique_quadrigram_language_models.shrink_to_fit();
301295
self.unique_fivegram_language_models.shrink_to_fit();
302-
}
303-
304-
if self.is_built_from_one_language {
305296
self.most_common_unigram_language_models.shrink_to_fit();
306297
self.most_common_bigram_language_models.shrink_to_fit();
307298
self.most_common_trigram_language_models.shrink_to_fit();
@@ -769,7 +760,7 @@ impl LanguageDetector {
769760
return values;
770761
}
771762

772-
if self.is_built_from_one_language || self.is_low_accuracy_mode_enabled {
763+
if self.is_built_from_one_language {
773764
if let Some(language) = self.detect_language_with_unique_and_common_ngrams(&words) {
774765
update_confidence_values(&mut values, language, 1.0);
775766
values.sort_by(confidence_values_comparator);

0 commit comments

Comments
 (0)