about summary refs log tree commit diff
path: root/app/lib
diff options
context:
space:
mode:
author: Eugen Rochko <eugen@zeonfederated.com> 2019-03-26 01:23:59 +0100
committer: GitHub <noreply@github.com> 2019-03-26 01:23:59 +0100
commit: e6cfa7ab897ac4fd6bf9bbcafe09fc42c4cc2c5d (patch)
tree: 619af1ebfd3bdb8690dbbabfaee3efa961c1e1cc /app/lib
parent: 94e5e834f2ddbc791ab27e2ef17eb2f23140a6ba (diff)
Change language detector threshold from 140 characters to 4 words (#10376)
Add `lang` attribute to statuses in web UI
Diffstat (limited to 'app/lib')
-rw-r--r-- app/lib/language_detector.rb 4
1 file changed, 2 insertions, 2 deletions
diff --git a/app/lib/language_detector.rb b/app/lib/language_detector.rb
index 70a9084d1..1e90af42d 100644
--- a/app/lib/language_detector.rb
+++ b/app/lib/language_detector.rb
@@ -3,7 +3,7 @@
 class LanguageDetector
   include Singleton
 
-  CHARACTER_THRESHOLD    = 140
+  WORDS_THRESHOLD        = 4
   RELIABLE_CHARACTERS_RE = /[\p{Hebrew}\p{Arabic}\p{Syriac}\p{Thaana}\p{Nko}\p{Han}\p{Katakana}\p{Hiragana}\p{Hangul}]+/m
 
   def initialize
@@ -37,7 +37,7 @@ class LanguageDetector
   end
 
   def sufficient_text_length?(text)
-    text.size >= CHARACTER_THRESHOLD
+    text.split(/\s+/).size >= WORDS_THRESHOLD
   end
 
   def language_specific_character_set?(text)