okjson.rb in taps2-0.6.0

- old
+ new

@@ -39,152 +39,123 @@
   # String values in the resulting structure
   # will be UTF-8.
   def decode(s)
     # Tokenize the whole input first, then parse a single json text
     # from the front of the token list.
     ts = lex(s)
     v, ts = textparse(ts)
-    if ts.length > 0
-      raise OkJson::ParserError, 'trailing garbage'
-    end
     # textparse hands back the tokens it did not consume; any leftover
     # token means the input held more than one json text.
+    raise OkJson::ParserError, 'trailing garbage' unless ts.empty?
     v
   end
 
-
   # Parses a "json text" in the sense of RFC 4627.
   # Returns the parsed value and any trailing tokens.
   # Note: this is almost the same as valparse,
   # except that it does not accept atomic values.
   def textparse(ts)
     # ts is the token list produced by lex: [type, lexeme, value] triples.
     # Returns [parsed value, remaining tokens].
     # Raises OkJson::ParserError when there is nothing to parse.
     #
     # The emptiness test must be `empty?`: a length is never negative, so
     # the former `ts.length < 0` guard could not fire.
     raise OkJson::ParserError, 'empty' if ts.empty?

     # Dispatch on the type tag of the first token. Anything that does not
     # open an object or an array is delegated to valparse.
     case ts[0][0]
     when '{' then objparse(ts)
     when '[' then arrparse(ts)
     else valparse(ts)
     end
   end
 
-
   # Parses a "value" in the sense of RFC 4627.
   # Returns the parsed value and any trailing tokens.
   def valparse(ts)
     # ts is a list of [type, lexeme, value] tokens.
     # Returns [parsed value, remaining tokens].
     # Raises OkJson::ParserError when ts is empty or starts with a token
     # that cannot begin a value.
     #
     # `empty?` replaces the former `ts.length < 0`, which was never true
     # and let an exhausted token list fall through to the case below.
     raise OkJson::ParserError, 'empty' if ts.empty?

     typ, _, val = ts[0]
     case typ
     when '{' then objparse(ts)
     when '[' then arrparse(ts)
     when :val, :str then [val, ts[1..-1]]
     else
       raise OkJson::ParserError, "unexpected #{val.inspect}"
     end
   end
 
-
   # Parses an "object" in the sense of RFC 4627.
   # Returns the parsed value and any trailing tokens.
   def objparse(ts)
     # ts must start with a '{' token.
     # Returns [Hash, remaining tokens].
     # Raises OkJson::ParserError on malformed or truncated input.
     ts = eat('{', ts)
     obj = {}

     # Running out of tokens before the closing brace used to crash with
     # NoMethodError (ts[0] is nil on an empty list); report it as a
     # parse error instead.
     raise OkJson::ParserError, 'unterminated object' if ts.empty?
     return obj, ts[1..-1] if ts[0][0] == '}'

     loop do
       k, v, ts = pairparse(ts)
       obj[k] = v

       raise OkJson::ParserError, 'unterminated object' if ts.empty?
       return obj, ts[1..-1] if ts[0][0] == '}'

       # Not closed yet, so the next token has to be the member separator.
       ts = eat(',', ts)
     end
   end
 
-
   # Parses a "member" in the sense of RFC 4627.
   # Returns the parsed value and any trailing tokens.
   def pairparse(ts)
     # Parses one `key : value` member from the front of ts.
     # Returns [key, value, remaining tokens].
     # Raises OkJson::ParserError when the first token is not a :str token.
-    (typ, _, k), ts = ts[0], ts[1..-1]
-    if typ != :str
-      raise OkJson::ParserError, "unexpected #{k.inspect}"
-    end
     # Take the first token apart (type, lexeme, value) and drop it from ts.
+    (typ, _, k) = ts[0]
+    ts = ts[1..-1]
+    raise OkJson::ParserError, "unexpected #{k.inspect}" if typ != :str
     # A colon must separate the key from its value.
     ts = eat(':', ts)
     v, ts = valparse(ts)
     [k, v, ts]
   end
 
-
   # Parses an "array" in the sense of RFC 4627.
   # Returns the parsed value and any trailing tokens.
   def arrparse(ts)
     # ts must start with a '[' token.
     # Returns [Array, remaining tokens].
     # Raises OkJson::ParserError on malformed or truncated input.
     ts = eat('[', ts)
     arr = []

     # An exhausted token list used to crash with NoMethodError here
     # (ts[0] is nil on an empty list); report it as a parse error instead.
     raise OkJson::ParserError, 'unterminated array' if ts.empty?
     return arr, ts[1..-1] if ts[0][0] == ']'

     loop do
       v, ts = valparse(ts)
       arr << v

       raise OkJson::ParserError, 'unterminated array' if ts.empty?
       return arr, ts[1..-1] if ts[0][0] == ']'

       # Not closed yet, so the next token has to be the element separator.
       ts = eat(',', ts)
     end
   end
 
-
   def eat(typ, ts)
     # Consumes one token of type typ from the front of ts.
     # Returns the remaining tokens.
     # Raises OkJson::ParserError when the next token has a different type
     # or when no tokens are left.
     #
     # Without the emptiness check, ts[0] is nil on an exhausted list and
     # ts[0][0] fails with NoMethodError rather than a parse error.
     if ts.nil? || ts.empty?
       raise OkJson::ParserError, "expected #{typ} (got end of input)"
     end
     if ts[0][0] != typ
       raise OkJson::ParserError, "expected #{typ} (got #{ts[0].inspect})"
     end
     ts[1..-1]
   end
 
-
   # Scans s and returns a list of json tokens,
   # excluding white space (as defined in RFC 4627).
   def lex(s)
     # Splits s into [type, lexeme, value] tokens, dropping :space tokens.
     # Raises OkJson::ParserError when no token can be scanned at the
     # current position.
     ts = []
     until s.empty?
       typ, lexeme, val = tok(s)
       # The literal scanners (nulltok, truetok, falsetok) yield false, not
       # nil, on a mismatch, so test for any falsy type. A nil-only check
       # lets false through and then crashes on lexeme.length below.
       unless typ
         raise OkJson::ParserError, "invalid character at #{s[0, 10].inspect}"
       end
       ts << [typ, lexeme, val] if typ != :space
       # Advance past the text the token covered.
       s = s[lexeme.length..-1]
     end
     ts
   end
 
-
   # Scans the first token in s and
   # returns a 3-element list, or nil
   # if no such token exists.
   #
   # The first list element is one of
@@ -196,102 +167,104 @@
   # The third element is the value of the
   # token for :val and :str, otherwise
   # it is the lexeme.
   def tok(s)
     # Dispatch on the first character of s. Punctuation and white space
     # become one-character tokens directly; literals and strings are
     # handed to their own scanners; anything else is tried as a number.
     case s[0]
-    when ?{  then ['{', s[0,1], s[0,1]]
-    when ?}  then ['}', s[0,1], s[0,1]]
-    when ?:  then [':', s[0,1], s[0,1]]
-    when ?,  then [',', s[0,1], s[0,1]]
-    when ?[  then ['[', s[0,1], s[0,1]]
-    when ?]  then [']', s[0,1], s[0,1]]
-    when ?n  then nulltok(s)
-    when ?t  then truetok(s)
-    when ?f  then falsetok(s)
-    when ?"  then strtok(s)
-    when Spc then [:space, s[0,1], s[0,1]]
-    when ?\t then [:space, s[0,1], s[0,1]]
-    when ?\n then [:space, s[0,1], s[0,1]]
-    when ?\r then [:space, s[0,1], s[0,1]]
-    else          numtok(s)
+    when '{'  then ['{', s[0, 1], s[0, 1]]
+    when '}'  then ['}', s[0, 1], s[0, 1]]
+    when ':'  then [':', s[0, 1], s[0, 1]]
+    when ','  then [',', s[0, 1], s[0, 1]]
+    when '['  then ['[', s[0, 1], s[0, 1]]
+    when ']'  then [']', s[0, 1], s[0, 1]]
+    when 'n'  then nulltok(s)
+    when 't'  then truetok(s)
+    when 'f'  then falsetok(s)
+    when '"'  then strtok(s)
+    when Spc then [:space, s[0, 1], s[0, 1]]
+    when "\t" then [:space, s[0, 1], s[0, 1]]
+    when "\n" then [:space, s[0, 1], s[0, 1]]
+    when "\r" then [:space, s[0, 1], s[0, 1]]
     # numtok returns nil when s does not start with a number.
+    else numtok(s)
     end
   end
 
+  def nulltok(s)
     # Scans the literal `null` at the start of s.
     # Returns the [:val, lexeme, value] triple on a match.
     # NOTE(review): on a mismatch the `&&` yields false, not nil, while
     # tok's header comment promises nil; callers must test for falsiness.
+    s[0, 4] == 'null'  && [:val, 'null',  nil]
+  end
 
-  def nulltok(s);  s[0,4] == 'null'  && [:val, 'null',  nil]   end
-  def truetok(s);  s[0,4] == 'true'  && [:val, 'true',  true]  end
-  def falsetok(s); s[0,5] == 'false' && [:val, 'false', false] end
+  def truetok(s)
     # Scans the literal `true` at the start of s; false on a mismatch.
+    s[0, 4] == 'true'  && [:val, 'true',  true]
+  end
 
+  def falsetok(s)
     # Scans the literal `false` at the start of s; false on a mismatch.
+    s[0, 5] == 'false' && [:val, 'false', false]
+  end
 
   def numtok(s)
     # Scans a json number at the start of s.
     # Returns [:val, lexeme, value], or nil when s does not start with a
     # number. The value is an Integer unless the number has a fraction or
     # a negative exponent, in which case it is a Float.
     #
     # \A anchors the match to the start of s, which is what the former
     # `m.begin(0) == 0` check enforced after scanning the whole string.
     m = /\A-?([1-9][0-9]+|[0-9])([.][0-9]+)?([eE][+-]?[0-9]+)?/.match(s)
     return nil unless m

     lexeme = m[0]
     frac = m[2]
     exp = m[3]
     return [:val, lexeme, Float(lexeme)] if frac
     return [:val, lexeme, Integer(lexeme, 10)] unless exp

     # Base 10 is explicit so a zero-padded exponent such as "08" is not
     # read as (invalid) octal.
     power = Integer(exp[1..-1], 10)

     # 10**negative is a Rational, which numenc would print as "1/100";
     # a negative exponent therefore produces a Float.
     return [:val, lexeme, Float(lexeme)] if power < 0

     # Take the mantissa from the lexeme itself so that a leading minus
     # sign is kept (capture group 1 excludes it).
     mantissa = Integer(lexeme[0, lexeme.length - exp.length], 10)
     [:val, lexeme, mantissa * (10**power)]
   end
 
-
   def strtok(s)
     # Scans a json string literal at the start of s.
     # Returns [:str, lexeme, unquoted value].
     # Raises OkJson::ParserError when s does not start with a valid literal.
     #
     # \A pins the match to the start of s. Unanchored, a malformed literal
     # at the start could be skipped in favour of a quoted run later in s,
     # and the caller would then advance by the wrong lexeme.
     m = /\A"([^"\\]|\\["\/\\bfnrt]|\\u[0-9a-fA-F]{4})*"/.match(s)
     raise OkJson::ParserError, "invalid string literal at #{abbrev(s)}" unless m
     [:str, m[0], unquote(m[0])]
   end
 
-
   def abbrev(s)
     # Returns a short excerpt of s wrapped in backticks, for error messages.
     # At most the first 10 characters are kept, the excerpt stops before
     # any backtick, and '...' marks that s continues past it.
     t = s[0, 10]
     # String#index gives the position of the backtick. String#[] with a
     # string argument returns the matched substring, which cannot be used
     # as a length.
     cut = t.index('`')
     t = t[0, cut] if cut
     t += '...' if t.length < s.length
     '`' + t + '`'
   end
 
-
   # Converts a quoted json string literal q into a UTF-8-encoded string.
   # The rules are different than for Ruby, so we cannot use eval.
   # Unquote raises OkJson::ParserError if q contains control characters.
   def unquote(q)
     q = q[1...-1]
     a = q.dup # allocate a big enough string
-    r, w = 0, 0
+    r = 0
+    w = 0
     while r < q.length
       c = q[r]
       case true
-      when c == ?\\
+      when c == '\\'
         r += 1
         if r >= q.length
           raise OkJson::ParserError, "string literal ends with a \"\\\": \"#{q}\""
         end
 
         case q[r]
-        when ?",?\\,?/,?'
+        when '"', '\\', '/', "'"
           a[w] = q[r]
           r += 1
           w += 1
-        when ?b,?f,?n,?r,?t
+        when 'b', 'f', 'n', 'r', 't'
           a[w] = Unesc[q[r]]
           r += 1
           w += 1
-        when ?u
+        when 'u'
           r += 1
           uchar = begin
-            hexdec4(q[r,4])
+            hexdec4(q[r, 4])
           rescue RuntimeError => e
-            raise OkJson::ParserError, "invalid escape sequence \\u#{q[r,4]}: #{e}"
+            raise OkJson::ParserError, "invalid escape sequence \\u#{q[r, 4]}: #{e}"
           end
           r += 4
           if surrogate? uchar
-            if q.length >= r+6
-              uchar1 = hexdec4(q[r+2,4])
+            if q.length >= r + 6
+              uchar1 = hexdec4(q[r + 2, 4])
               uchar = subst(uchar, uchar1)
               if uchar != Ucharerr
                 # A valid pair; consume.
                 r += 6
               end
@@ -299,66 +272,56 @@
           end
           w += ucharenc(a, w, uchar)
         else
           raise OkJson::ParserError, "invalid escape char #{q[r]} in \"#{q}\""
         end
-      when c == ?", c < Spc
+      when c == '"', c < Spc
         raise OkJson::ParserError, "invalid character in string literal \"#{q}\""
       else
         # Copy anything else byte-for-byte.
         # Valid UTF-8 will remain valid UTF-8.
         # Invalid UTF-8 will remain invalid UTF-8.
         a[w] = c
         r += 1
         w += 1
       end
     end
-    a[0,w]
+    a[0, w]
   end
 
-
   def hexdec4(s)
     # Decodes exactly four hex digits in s into an integer.
     # Raises OkJson::ParserError ('short') when s is not 4 characters long;
     # nibble raises for any character it does not accept.
-    if s.length != 4
-      raise OkJson::ParserError, 'short'
-    end
-    (nibble(s[0])<<12) | (nibble(s[1])<<8) | (nibble(s[2])<<4) | nibble(s[3])
+    raise OkJson::ParserError, 'short' if s.length != 4
     # Most significant digit first: each digit contributes 4 bits.
+    (nibble(s[0]) << 12) | (nibble(s[1]) << 8) | (nibble(s[2]) << 4) | nibble(s[3])
   end
 
-
   def subst(u1, u2)
     # Combines a surrogate pair into the code point it encodes.
     # u1 must lie in [Usurr1, Usurr2) and u2 in [Usurr2, Usurr3);
     # any other combination returns Ucharerr.
     if Usurr1 <= u1 && u1 < Usurr2 && Usurr2 <= u2 && u2 < Usurr3
       # The 20 payload bits are assembled first and Usurrself is added
       # afterwards. In Ruby `+` binds tighter than `|`, so without the
       # outer parentheses the offset is OR-ed in, and the result is wrong
       # whenever the shifted high half already has bit 16 set.
       return (((u1 - Usurr1) << 10) | (u2 - Usurr2)) + Usurrself
     end
     Ucharerr
   end
 
-
   def unsubst(u)
     # Splits code point u into a surrogate pair [first, second].
     # Returns [Ucharerr, Ucharerr] when u is below Usurrself, above Umax,
     # or itself a surrogate.
-    if u < Usurrself || u > Umax || surrogate?(u)
-      return Ucharerr, Ucharerr
-    end
+    return Ucharerr, Ucharerr if u < Usurrself || u > Umax || surrogate?(u)
     u -= Usurrself
-    [Usurr1 + ((u>>10)&0x3ff), Usurr2 + (u&0x3ff)]
     # Upper 10 bits go into the first half, lower 10 bits into the second.
+    [Usurr1 + ((u >> 10) & 0x3ff), Usurr2 + (u & 0x3ff)]
   end
 
-
   def surrogate?(u)
     # True when u lies in the half-open range [Usurr1, Usurr3).
     return false if Usurr1 > u

     u < Usurr3
   end
 
-
   def nibble(c)
     # Converts one hex digit character into its value (0..15).
     # Raises OkJson::ParserError for any other character.
     #
     # The letter ranges stop at f/F: accepting g..z would return values
     # above 15 that spill into the neighbouring digit when hexdec4 shifts
     # and ORs the four nibbles together.
     case c
     when '0'..'9' then c.ord - '0'.ord
     when 'a'..'f' then c.ord - 'a'.ord + 10
     when 'A'..'F' then c.ord - 'A'.ord + 10
     else
       raise OkJson::ParserError, "invalid hex code #{c}"
     end
   end
 
-
   # Encodes x into a json text. It may contain only
   # Array, Hash, String, Numeric, true, false, nil.
   # (Note, this list excludes Symbol.)
   # Strings contained in x must be valid UTF-8.
   # Values that cannot be represented, such as
@@ -369,45 +332,42 @@
     when Hash    then objenc(x)
     when Array   then arrenc(x)
     when String  then strenc(x)
     when Numeric then numenc(x)
     when Symbol  then strenc(x.to_s)
-    when true    then "true"
-    when false   then "false"
-    when nil     then "null"
-    else              "null"
+    when true    then 'true'
+    when false   then 'false'
+    when nil     then 'null'
+    else              'null'
     end
   end
 
-
   def objenc(x)
     # Encodes hash x as a json object: each key and each value is passed
     # through encode, joined as key:value pairs separated by commas.
     # NOTE(review): keys go through the general encode, so a key that
     # encode does not render as a json string is emitted unquoted; confirm
     # that callers only pass String or Symbol keys.
-    '{' + x.map{|k,v| encode(k) + ':' + encode(v)}.join(',') + '}'
+    '{' + x.map { |k, v| encode(k) + ':' + encode(v) }.join(',') + '}'
   end
 
-
   def arrenc(a)
     # Encodes array a as a json array: every element is passed through
     # encode and the results are joined with commas.
-    '[' + a.map{|x| encode(x)}.join(',') + ']'
+    '[' + a.map { |x| encode(x) }.join(',') + ']'
   end
 
-
   def strenc(s)
     t = StringIO.new
-    t.putc(?")
+    t.putc('"')
     r = 0
     while r < s.length
       case s[r]
-      when ?"  then t.print('\\"')
-      when ?\\ then t.print('\\\\')
-      when ?\b then t.print('\\b')
-      when ?\f then t.print('\\f')
-      when ?\n then t.print('\\n')
-      when ?\r then t.print('\\r')
-      when ?\t then t.print('\\t')
+      when '"'  then t.print('\\"')
+      when '\\' then t.print('\\\\')
+      when "\b" then t.print('\\b')
+      when "\f" then t.print('\\f')
+      when "\n" then t.print('\\n')
+      when "\r" then t.print('\\r')
+      when "\t" then t.print('\\t')
       else
         c = s[r]
         case true
-        when Spc <= c && c <= ?~
+        when Spc <= c && c <= '~'
           t.putc(c)
         when true
           u, size = uchardec(s, r)
           r += size - 1 # we add one more at the bottom of the loop
           if u < 0x10000
@@ -418,116 +378,110 @@
             t.print('\\u')
             hexenc4(t, u1)
             t.print('\\u')
             hexenc4(t, u2)
           end
-        else
-          # invalid byte; skip it
         end
       end
       r += 1
     end
-    t.putc(?")
+    t.putc('"')
     t.string
   end
 
-
   def hexenc4(t, u)
     # Writes the low 16 bits of u to t as four hex digits, most significant
     # nibble first, using the Hex lookup string. t must respond to putc.
-    t.putc(Hex[(u>>12)&0xf])
-    t.putc(Hex[(u>>8)&0xf])
-    t.putc(Hex[(u>>4)&0xf])
-    t.putc(Hex[u&0xf])
+    t.putc(Hex[(u >> 12) & 0xf])
+    t.putc(Hex[(u >> 8) & 0xf])
+    t.putc(Hex[(u >> 4) & 0xf])
+    t.putc(Hex[u & 0xf])
   end
 
-
   def numenc(x)
     # Encodes number x as json text: 'null' for NaN or an infinity,
     # otherwise x.to_s.
-    if x.nan? || x.infinite?
-      return 'null'
-    end rescue nil
-    "#{x}"
     # The rescue swallows any error raised by the nan?/infinite? probe and
     # falls through to to_s. Presumably this covers numeric types that do
     # not define those predicates -- TODO confirm.
+    begin
+      return 'null' if x.nan? || x.infinite?
+    rescue
+      nil
+    end
+    x.to_s
   end
 
-
   # Decodes unicode character u from UTF-8
   # bytes in string s at position i.
   # Returns u and the number of bytes read.
   def uchardec(s, i)
     # Returns [code point, length]. Every failure path returns
     # [Ucharerr, 1], so the caller advances by one position.
     # n is how much of s remains from position i.
     n = s.length - i
     return [Ucharerr, 1] if n < 1
 
     c0 = s[i].ord
 
     # 1-byte, 7-bit sequence?
-    if c0 < Utagx
-      return [c0, 1]
-    end
+    return [c0, 1] if c0 < Utagx
 
     # unexpected continuation byte?
     return [Ucharerr, 1] if c0 < Utag2
 
     # need continuation byte
     return [Ucharerr, 1] if n < 2
-    c1 = s[i+1].ord
+    c1 = s[i + 1].ord
     # A continuation byte must lie in [Utagx, Utag2).
     return [Ucharerr, 1] if c1 < Utagx || Utag2 <= c1
 
     # 2-byte, 11-bit sequence?
     if c0 < Utag3
-      u = (c0&Umask2)<<6 | (c1&Umaskx)
+      u = (c0 & Umask2) << 6 | (c1 & Umaskx)
       # Reject a value that would have fit in a shorter sequence.
       return [Ucharerr, 1] if u <= Uchar1max
       return [u, 2]
     end
 
     # need second continuation byte
     return [Ucharerr, 1] if n < 3
-    c2 = s[i+2].ord
+    c2 = s[i + 2].ord
     return [Ucharerr, 1] if c2 < Utagx || Utag2 <= c2
 
     # 3-byte, 16-bit sequence?
     if c0 < Utag4
-      u = (c0&Umask3)<<12 | (c1&Umaskx)<<6 | (c2&Umaskx)
+      u = (c0 & Umask3) << 12 | (c1 & Umaskx) << 6 | (c2 & Umaskx)
       # Reject a value that would have fit in a shorter sequence.
       return [Ucharerr, 1] if u <= Uchar2max
       return [u, 3]
     end
 
     # need third continuation byte
     return [Ucharerr, 1] if n < 4
-    c3 = s[i+3].ord
+    c3 = s[i + 3].ord
     return [Ucharerr, 1] if c3 < Utagx || Utag2 <= c3
 
     # 4-byte, 21-bit sequence?
     if c0 < Utag5
-      u = (c0&Umask4)<<18 | (c1&Umaskx)<<12 | (c2&Umaskx)<<6 | (c3&Umaskx)
+      u = (c0 & Umask4) << 18 | (c1 & Umaskx) << 12 | (c2 & Umaskx) << 6 | (c3 & Umaskx)
       # Reject a value that would have fit in a shorter sequence.
       return [Ucharerr, 1] if u <= Uchar3max
       return [u, 4]
     end
 
     # A lead byte of Utag5 or above starts no sequence handled here.
-    return [Ucharerr, 1]
+    [Ucharerr, 1]
   end
 
-
   # Encodes unicode character u as UTF-8
   # bytes in string a at position i.
   # Returns the number of bytes written.
   def ucharenc(a, i, u)
     # Picks the sequence length from the size of u, then stores one
     # single-byte string (Integer#chr) per position starting at a[i].
     # NOTE(review): the final branch handles every u above Uchar3max and
     # does not check u against Umax -- confirm callers never pass more.
     case true
     when u <= Uchar1max
       a[i] = (u & 0xff).chr
       1
     when u <= Uchar2max
-      a[i+0] = (Utag2 | ((u>>6)&0xff)).chr
-      a[i+1] = (Utagx | (u&Umaskx)).chr
       # Lead byte carries the bits above the low 6; the rest go into one
       # continuation byte.
+      a[i + 0] = (Utag2 | ((u >> 6) & 0xff)).chr
+      a[i + 1] = (Utagx | (u & Umaskx)).chr
       2
     when u <= Uchar3max
-      a[i+0] = (Utag3 | ((u>>12)&0xff)).chr
-      a[i+1] = (Utagx | ((u>>6)&Umaskx)).chr
-      a[i+2] = (Utagx | (u&Umaskx)).chr
+      a[i + 0] = (Utag3 | ((u >> 12) & 0xff)).chr
+      a[i + 1] = (Utagx | ((u >> 6) & Umaskx)).chr
+      a[i + 2] = (Utagx | (u & Umaskx)).chr
       3
     else
-      a[i+0] = (Utag4 | ((u>>18)&0xff)).chr
-      a[i+1] = (Utagx | ((u>>12)&Umaskx)).chr
-      a[i+2] = (Utagx | ((u>>6)&Umaskx)).chr
-      a[i+3] = (Utagx | (u&Umaskx)).chr
+      a[i + 0] = (Utag4 | ((u >> 18) & 0xff)).chr
+      a[i + 1] = (Utagx | ((u >> 12) & Umaskx)).chr
+      a[i + 2] = (Utagx | ((u >> 6) & Umaskx)).chr
+      a[i + 3] = (Utagx | (u & Umaskx)).chr
       4
     end
   end
 
   Utagx = 0x80 # 1000 0000
@@ -537,19 +491,19 @@
   Utag5 = 0xF8 # 1111 1000
   # Payload masks: Umaskx for a continuation byte, Umask2..Umask4 for the
   # lead byte of a 2-, 3- and 4-byte sequence (see uchardec).
   Umaskx = 0x3f # 0011 1111
   Umask2 = 0x1f # 0001 1111
   Umask3 = 0x0f # 0000 1111
   Umask4 = 0x07 # 0000 0111
-  Uchar1max = (1<<7) - 1
-  Uchar2max = (1<<11) - 1
-  Uchar3max = (1<<16) - 1
   # Largest code point that ucharenc writes in 1, 2 and 3 bytes.
+  Uchar1max = (1 << 7) - 1
+  Uchar2max = (1 << 11) - 1
+  Uchar3max = (1 << 16) - 1
   Ucharerr = 0xFFFD # unicode "replacement char"
   # Surrogate handling: Usurrself is the offset added by subst and removed
   # by unsubst; the first half of a pair lies in [Usurr1, Usurr2) and the
   # second half in [Usurr2, Usurr3).
   Usurrself = 0x10000
   Usurr1 = 0xd800
   Usurr2 = 0xdc00
   Usurr3 = 0xe000
   # Upper bound checked by unsubst.
   Umax = 0x10ffff
 
   # First character of a one-space string; used as the lower bound when
   # testing for control characters.
   Spc = ' '[0]
-  Unesc = {?b=>?\b, ?f=>?\f, ?n=>?\n, ?r=>?\r, ?t=>?\t}
-  Hex = '0123456789abcdef'
   # Maps the letter of a backslash escape to the character it stands for.
+  Unesc = { 'b' => "\b", 'f' => "\f", 'n' => "\n", 'r' => "\r", 't' => "\t" }.freeze
   # Digit lookup used by hexenc4.
+  Hex = '0123456789abcdef'.freeze
 end