# encoding: utf-8 require 'rubygems' require 'minitest/autorun' # Require implementation require File.expand_path('../../../lib/ascii85', __FILE__) describe Ascii85 do UNSUPPORTED_MSG = "This version of Ruby does not support encodings" TEST_CASES = { "" => "", " " => "<~+9~>", "\0" * 1 => "<~!!~>", "\0" * 2 => "<~!!!~>", "\0" * 3 => "<~!!!!~>", "\0" * 4 => "<~z~>", "\0" * 5 => "<~z!!~>", "A\0\0\0\0" => "<~5l^lb!!~>", # No z-abbreviation! "A" => "<~5l~>", "AB" => "<~5sb~>", "ABC" => "<~5sdp~>", "ABCD" => "<~5sdq,~>", "ABCDE" => "<~5sdq,70~>", "ABCDEF" => "<~5sdq,77I~>", "ABCDEFG" => "<~5sdq,77Kc~>", "ABCDEFGH" => "<~5sdq,77Kd<~>", "ABCDEFGHI" => "<~5sdq,77Kd<8H~>", "Ascii85" => "<~6$$OMBfIs~>", 'Antidisestablishmentarianism' => '<~6#LdYA8-*rF*(i"Ch[s(D.RU,@<-\'jDJ=0/~>', # Dōmo arigatō, Mr. Roboto (according to Wikipedia) 'どうもありがとうミスターロボット' => "<~j+42iJVN3:K&_E6j+<0KJW/W?W8iG`j+EuaK\"9on^Z0sZj+FJoK:LtSKB%T?~>", [Math::PI].pack('G') => "<~5RAV2<(&;T~>", [Math::E].pack('G') => "<~5R\"n0M\\K6,~>" } it "#decode should be the inverse of #encode" do # Generate a random string test_str = "" (1 + rand(255)).times do test_str << rand(256).chr end encoded = Ascii85.encode(test_str) decoded = Ascii85.decode(encoded) decoded.must_equal test_str end describe "#encode" do it "should encode all specified test-cases correctly" do TEST_CASES.each_pair do |input, encoded| Ascii85.encode(input).must_equal encoded end end it "should encode Strings in different encodings correctly" do unless String.new.respond_to?(:encoding) skip(UNSUPPORTED_MSG) end input_EUC_JP = 'どうもありがとうミスターロボット'.encode('EUC-JP') input_binary = input_EUC_JP.force_encoding('ASCII-8BIT') Ascii85.encode(input_EUC_JP).must_equal Ascii85.encode(input_binary) end it "should produce output lines no longer than specified" do test_str = '0123456789' * 30 # # No wrap # Ascii85.encode(test_str, false).count("\n").must_equal 0 # # x characters per line, except for the last one # x = 2 + rand(255) # < test_str.length encoded = Ascii85.encode(test_str, x) # Determine the length of all lines count_arr = [] encoded.each_line do |line| count_arr << line.chomp.length end # The last line is allowed to be shorter than x, so remove it count_arr.pop if count_arr.last <= x # If the end-marker is on a line of its own, the next-to-last line is # allowed to be shorter than specified by exactly one character count_arr.pop if (encoded[-3].chr =~ /[\r\n]/) and (count_arr.last == x-1) # Remove all line-lengths that are of length x from count_arr count_arr.delete_if { |len| len == x } # Now count_arr should be empty count_arr.must_be_empty end it "should not split the end-marker to achieve correct line length" do Ascii85.encode("\0" * 4, 4).must_equal "<~z\n~>" end end describe "#decode" do it "should decode all specified test-cases correctly" do TEST_CASES.each_pair do |decoded, input| if String.new.respond_to?(:encoding) Ascii85.decode(input).must_equal decoded.dup.force_encoding('ASCII-8BIT') else Ascii85.decode(input).must_equal decoded end end end it "should accept valid input in encodings other than the default" do unless String.new.respond_to?(:encoding) skip(UNSUPPORTED_MSG) end input = "Ragnarök τέχνη русский язык I ♥ Ruby" input_ascii85 = Ascii85.encode(input) # Try to encode input_ascii85 in all possible encodings and see if we # do the right thing in #decode. Encoding.list.each do |encoding| next if encoding.dummy? next unless encoding.ascii_compatible? # CP949 is a Microsoft Codepage for Korean, which apparently does not # include a backslash, even though #ascii_compatible? returns true. This # leads to an Ascii85::DecodingError, so we simply skip the encoding. next if encoding.name == "CP949" begin to_test = input_ascii85.encode(encoding) Ascii85.decode(to_test).force_encoding('UTF-8').must_equal input rescue Encoding::ConverterNotFoundError # Ignore this encoding end end end it "should only process data within delimiters" do Ascii85.decode("<~~>").must_be_empty Ascii85.decode("Doesn't contain delimiters").must_be_empty Ascii85.decode("Mismatched ~> delimiters 1").must_be_empty Ascii85.decode("Mismatched <~ delimiters 2").must_be_empty Ascii85.decode("Mismatched ~><~ delimiters 3").must_be_empty Ascii85.decode("<~;KZGo~><~z~>").must_equal "Ruby" Ascii85.decode("FooBar<~z~>BazQux").must_equal "\0\0\0\0" end it "should ignore whitespace" do decoded = Ascii85.decode("<~6 #LdYA\r\08\n \n\n- *rF*(i\"Ch[s \t(D.RU,@ <-\'jDJ=0\f/~>") decoded.must_equal 'Antidisestablishmentarianism' end it "should return ASCII-8BIT encoded strings" do unless String.new.respond_to?(:encoding) skip(UNSUPPORTED_MSG) end Ascii85.decode("<~;KZGo~>").encoding.name.must_equal "ASCII-8BIT" end describe "Error conditions" do it "should raise DecodingError if it encounters a word >= 2**32" do lambda { Ascii85.decode('<~s8W-#~>') }.must_raise(Ascii85::DecodingError) end it "should raise DecodingError if it encounters an invalid character" do lambda { Ascii85.decode('<~!!y!!~>') }.must_raise(Ascii85::DecodingError) end it "should raise DecodingError if the last tuple consists of a single character" do lambda { Ascii85.decode('<~!~>') }.must_raise(Ascii85::DecodingError) end it "should raise DecodingError if a z is found inside a 5-tuple" do lambda { Ascii85.decode('<~!!z!!~>') }.must_raise Ascii85::DecodingError end end end end