RubygemsResearch

Sha256: c634c4db1e47bdebab85e69a8ea661d2fe2450cb7d8f6f0130a12a05435e09d7

Contents?: true

Size: 1.73 KB

Versions: 1

Compression:

Stored size: 1.73 KB

# encoding: UTF-8

# Copyright 2012 Twitter, Inc
# http://www.apache.org/licenses/LICENSE-2.0

module TwitterCldr
  module Shared
    class UnicodeData
      Attributes = Struct.new(:code_point, :name, :category, :combining_class, :bidi_class, :decomposition,
                             :digit_value, :non_decimal_digit_value, :numeric_value, :bidi_mirrored, :unicode1_name,
                             :iso_comment, :simple_uppercase_map, :simple_lowercase_map, :simple_titlecase_map)
      class << self
        def for_code_point(code_point)
          blocks = TwitterCldr.get_resource("unicode_data", "blocks")

          #Find the target block
          target = blocks.find do |block_name, range|
            range.include? code_point.to_i(16)
          end

          if target
            block_data = TwitterCldr.get_resource("unicode_data", target.first)
            code_point_data = block_data.fetch(code_point.to_sym) { |code_point_sym| get_range_start(code_point_sym, block_data) }
            Attributes.new(*code_point_data) if code_point_data
          end
        end

        private
        # Check if block constitutes a range. The code point beginning a range will have a name enclosed in <>, ending with 'First'
        # eg: <CJK Ideograph Extension A, First>
        # http://unicode.org/reports/tr44/#Code_Point_Ranges
        def get_range_start(code_point, block_data)
          start_code_point = block_data.keys.sort_by { |key| key.to_s.to_i(16) }.first
          start_data = block_data[start_code_point].clone
          if start_data[1] =~ /<.*, First>/
            start_data[0] = code_point.to_s
            start_data[1] = start_data[1].sub(', First', '')
            start_data
          end
        end
      end
    end
  end
end

Version data entries

1 entries across 1 versions & 1 rubygems

Version	Path
twitter_cldr-1.2.0	lib/twitter_cldr/shared/unicode_data.rb