require_relative "name/constants" module Unicode module Name HANGUL_START = 44032 HANGUL_END = 55203 HANGUL_MEDIAL_MAX = 588 HANGUL_FINAL_MAX = 28 # Don't overwrite Module.name def self.unicode_name(char) codepoint = char.unpack("U")[0] require_relative "name/index" unless defined? ::Unicode::Name::INDEX if res = INDEX[:NAMES][codepoint] res elsif INDEX[:CJK].any?{ |cjk_range| codepoint >= cjk_range[0] && codepoint <= cjk_range[1] } "CJK UNIFIED IDEOGRAPH-%.4X" % codepoint elsif codepoint >= HANGUL_START && codepoint <= HANGUL_END "HANGUL SYLLABLE %s" % hangul_decomposition(codepoint) else nil end end class << self; alias of unicode_name; end def self.correct(char) codepoint = char.unpack("U")[0] require_relative "name/index" unless defined? ::Unicode::Name::INDEX if correction = INDEX[:ALIASES][codepoint] && INDEX[:ALIASES][codepoint][:correction] && INDEX[:ALIASES][codepoint][:correction][-1] correction else unicode_name(char) end end def self.aliases(char) codepoint = char.unpack("U")[0] require_relative "name/index" unless defined? ::Unicode::Name::INDEX INDEX[:ALIASES][codepoint] end def self.label(char) codepoint = char.unpack("U")[0] codepoint_pretty = "%.4X" % codepoint require_relative "name/index" unless defined? ::Unicode::Name::INDEX require "unicode/types" unless defined? ::Unicode::Types case Unicode::Types.type(char) when "Graphic", "Format" nil when "Control" "" when "Private-use" "" when "Surrogate" "" when "Noncharacter" "" when "Reserved" "" end end def self.readable(char) correct(char) || ( as = aliases(char) ) && ( as[:control] && as[:control][0] || as[:figment] && as[:figment][0] || as[:alternate] && as[:alternate][0] || as[:abbreviation] && as[:abbreviation][0] ) || label(char) end private # See https://en.wikipedia.org/wiki/Korean_language_and_computers#Hangul_Syllables_Area def self.hangul_decomposition(codepoint) base = codepoint - HANGUL_START final = base % HANGUL_FINAL_MAX medial = (base % HANGUL_MEDIAL_MAX) / HANGUL_FINAL_MAX initial = base / HANGUL_MEDIAL_MAX "#{INDEX[:JAMO][:INITIAL][initial]}#{INDEX[:JAMO][:MEDIAL][medial]}#{INDEX[:JAMO][:FINAL][final]}" end end end