Sha256: d839ea21da863c640e38cb887773b30f152c87a77bbe3658a498ae0ff89f3f79
Contents?: true
Size: 1.92 KB
Versions: 1
Compression:
Stored size: 1.92 KB
Contents
module WWW class Mechanize class Util CODE_DIC = { :JIS => "ISO-2022-JP", :EUC => "EUC-JP", :SJIS => "SHIFT_JIS", :UTF8 => "UTF-8", :UTF16 => "UTF-16", :UTF32 => "UTF-32"} class << self def build_query_string(parameters, enc=nil) parameters.map { |k,v| if k # WEBrick::HTTP.escape* has some problems about m17n on ruby-1.9.*. [URI.escape(k.to_s), URI.escape(v.to_s)].join("=") =begin [WEBrick::HTTPUtils.escape_form(k.to_s), WEBrick::HTTPUtils.escape_form(v.to_s)].join("=") =end end }.compact.join('&') end def to_native_charset(s, code=nil) if Mechanize.html_parser == Nokogiri::HTML return unless s code ||= detect_charset(s) Iconv.iconv("UTF-8", code, s).join("") else s end end def from_native_charset(s, code) if Mechanize.html_parser == Nokogiri::HTML return unless s Iconv.iconv(code, "UTF-8", s).join("") else return s end end def html_unescape(s) return s unless s s.gsub(/&(\w+|#[0-9]+);/) { |match| number = case match when /&(\w+);/ Mechanize.html_parser::NamedCharacters[$1] when /&#([0-9]+);/ $1.to_i end number ? ([number].pack('U') rescue match) : match } end def detect_charset(src) tmp = NKF.guess(src || "<html></html>") if RUBY_VERSION >= "1.9.0" enc = tmp.to_s.upcase else enc = NKF.constants.find{|c| NKF.const_get(c) == tmp } enc = CODE_DIC[enc.intern] end enc || "ISO-8859-1" end end end end end
Version data entries
1 entries across 1 versions & 1 rubygems
Version | Path |
---|---|
mechanize-0.9.1 | lib/www/mechanize/util.rb |