about summary refs log tree commit diff
path: root/app/lib/hashtag_normalizer.rb
blob: c1f99e16383f5cad8516be848ec6dc2f43448d79 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
# frozen_string_literal: true

class HashtagNormalizer
  def normalize(str)
    remove_invalid_characters(ascii_folding(lowercase(cjk_width(str))))
  end

  private

  def remove_invalid_characters(str)
    str.gsub(/[^[:alnum:]#{Tag::HASHTAG_SEPARATORS}]/, '')
  end

  def ascii_folding(str)
    ASCIIFolding.new.fold(str)
  end

  def lowercase(str)
    str.mb_chars.downcase.to_s
  end

  def cjk_width(str)
    str.unicode_normalize(:nfkc)
  end
end