about summary refs log tree commit diff
path: root/app/lib
diff options
context:
space:
mode:
author: Eugen Rochko <eugen@zeonfederated.com> 2019-07-18 03:02:15 +0200
committer: GitHub <noreply@github.com> 2019-07-18 03:02:15 +0200
commit: 5bfe1e1f0517a23637a1a132dbf0b62fd29982bc (patch)
tree: 1381c422424fe4cbf2b68839d2dcacc654796bb6 /app/lib
parent: 3a6fe657ba30c56677c271432338a7002191d772 (diff)
Change language detection to include hashtags as words (#11341)
Diffstat (limited to 'app/lib')
-rw-r--r-- app/lib/language_detector.rb 2
1 file changed, 1 insertion, 1 deletion
diff --git a/app/lib/language_detector.rb b/app/lib/language_detector.rb
index 1e90af42d..6f9511a54 100644
--- a/app/lib/language_detector.rb
+++ b/app/lib/language_detector.rb
@@ -69,7 +69,7 @@ class LanguageDetector
     new_text = remove_html(text)
     new_text.gsub!(FetchLinkCardService::URL_PATTERN, '')
     new_text.gsub!(Account::MENTION_RE, '')
-    new_text.gsub!(Tag::HASHTAG_RE, '')
+    new_text.gsub!(Tag::HASHTAG_RE) { |string| string.gsub(/[#_]/, '#' => '', '_' => ' ').gsub(/[a-z][A-Z]|[a-zA-Z][\d]/) { |s| s.insert(1, ' ') }.downcase }
     new_text.gsub!(/:#{CustomEmoji::SHORTCODE_RE_FRAGMENT}:/, '')
     new_text.gsub!(/\s+/, ' ')
     new_text