26 lines
444 B
Ruby
26 lines
444 B
Ruby
# frozen_string_literal: true
|
|
|
|
class HashtagNormalizer
|
|
def normalize(str)
|
|
remove_invalid_characters(ascii_folding(lowercase(cjk_width(str))))
|
|
end
|
|
|
|
private
|
|
|
|
def remove_invalid_characters(str)
|
|
str.gsub(Tag::HASHTAG_INVALID_CHARS_RE, '')
|
|
end
|
|
|
|
def ascii_folding(str)
|
|
ASCIIFolding.new.fold(str)
|
|
end
|
|
|
|
def lowercase(str)
|
|
str.mb_chars.downcase.to_s
|
|
end
|
|
|
|
def cjk_width(str)
|
|
str.unicode_normalize(:nfkc)
|
|
end
|
|
end
|