forked from specter/mastodon
26 lines
455 B
Ruby
26 lines
455 B
Ruby
|
# frozen_string_literal: true
|
||
|
|
||
|
class HashtagNormalizer
|
||
|
def normalize(str)
|
||
|
remove_invalid_characters(ascii_folding(lowercase(cjk_width(str))))
|
||
|
end
|
||
|
|
||
|
private
|
||
|
|
||
|
def remove_invalid_characters(str)
|
||
|
str.gsub(/[^[:alnum:]#{Tag::HASHTAG_SEPARATORS}]/, '')
|
||
|
end
|
||
|
|
||
|
def ascii_folding(str)
|
||
|
ASCIIFolding.new.fold(str)
|
||
|
end
|
||
|
|
||
|
def lowercase(str)
|
||
|
str.mb_chars.downcase.to_s
|
||
|
end
|
||
|
|
||
|
def cjk_width(str)
|
||
|
str.unicode_normalize(:nfkc)
|
||
|
end
|
||
|
end
|