about summary refs log tree commit diff
path: root/app/lib/hashtag_normalizer.rb
blob: 49fa6101de086df3e3abc54b115989438e66c93c (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
# frozen_string_literal: true

class HashtagNormalizer
  def normalize(str)
    remove_invalid_characters(ascii_folding(lowercase(cjk_width(str))))
  end

  private

  def remove_invalid_characters(str)
    str.gsub(Tag::HASHTAG_INVALID_CHARS_RE, '')
  end

  def ascii_folding(str)
    ASCIIFolding.new.fold(str)
  end

  def lowercase(str)
    str.mb_chars.downcase.to_s
  end

  def cjk_width(str)
    str.unicode_normalize(:nfkc)
  end
end