module WWW
  class Mechanize
    # =Synopsis
    # GlobalForm provides all access to form fields, such as the buttons,
    # check boxes, and text input.
    #
    # GlobalForm takes two nodes, the node where the form tag is located
    # (form_node), and another node, from which to start looking for form
    # elements (elements_node) like buttons and the like. For class Form
    # both fall together into one and the same node.
    #
    # Class Form does not work in the case there is some invalid (unbalanced)
    # html involved, such as (illustrative example):
    #
    #   <td>
    #     <form>
    #   </td>
    #   <td>
    #     <input .../>
    #     </form>
    #   </td>
    #
    class GlobalForm
      attr_reader :form_node, :elements_node
      attr_accessor :method, :action, :name

      attr_finder :fields, :buttons, :file_uploads, :radiobuttons, :checkboxes
      attr_reader :enctype

      # Reads method, action, name and enctype from the attributes of
      # +form_node+ and then collects the form elements found below
      # +elements_node+.
      #
      # The method defaults to 'GET' (and is upcased), the enctype defaults to
      # 'application/x-www-form-urlencoded'.
      def initialize(form_node, elements_node)
        @form_node = form_node
        @elements_node = elements_node

        form_attributes = @form_node.attributes
        @method = (form_attributes['method'] || 'GET').upcase
        @action = form_attributes['action']
        @name = form_attributes['name']
        @enctype = form_attributes['enctype'] || 'application/x-www-form-urlencoded'
        @clicked_buttons = []

        parse
      end

      # In the case of malformed HTML, fields of multiple forms might occur in
      # this form's field array. If the fields have the same name, posterior
      # fields overwrite former fields. To avoid this, this method rejects all
      # posterior duplicate fields (the first field of each name is kept).
      #
      # Returns whatever +reject!+ on the field list returns.
      def uniq_fields!
        seen_names = {}
        fields.reject! do |f|
          duplicate = seen_names.key?(f.name)
          seen_names[f.name] = true
          duplicate
        end
      end

      # This method builds an array of arrays that represent the query
      # parameters to be used with this form. The return value can then
      # be used to create a query string for this form.
      #
      # Included are, in this order: every field that has a value, every
      # checked checkbox, the checked radio button of each radio group, and
      # every button registered through add_button_to_query.
      #
      # The +buttons+ argument is accepted but not used by this method.
      #
      # Raises a RuntimeError if more than one radio button of the same group
      # is checked.
      def build_query(buttons = [])
        query = []

        fields.each do |f|
          next unless f.value
          query.push(*f.query_value)
        end

        checkboxes.each do |f|
          query.push(*f.query_value) if f.checked
        end

        # Radio buttons sharing a name form one group.
        radio_groups = {}
        radiobuttons.each do |f|
          (radio_groups[f.name] ||= []) << f
        end

        # take one radio button from each group
        radio_groups.each_value do |group|
          checked = group.select { |f| f.checked }

          if checked.size == 1
            query.push(*checked.first.query_value)
          elsif checked.size > 1
            raise "multiple radiobuttons are checked in the same group!"
          end
        end

        @clicked_buttons.each { |b| query.push(*b.query_value) }

        query
      end

      # This method adds a button to the query. If the form needs to be
      # submitted with multiple buttons, pass each button to this method.
      def add_button_to_query(button)
        @clicked_buttons << button
      end

      # This method calculates the request data to be sent back to the server
      # for this form, depending on whether this is a URL-encoded submission
      # or a multi-part post.
      #
      # For 'multipart/form-data' forms a fresh random boundary is generated
      # on every call and +enctype+ is updated to carry it
      # ("<media type>; boundary=<boundary>"). Any parameters previously
      # attached to the enctype are replaced by the new boundary.
      #
      # Returns the request body as a String.
      def request_data
        query_params = build_query

        # Compare the bare media type only: after an earlier call @enctype
        # already carries a "; boundary=..." parameter, and the form must
        # still be recognised as multipart.
        media_type = @enctype.split(';').first.to_s.strip

        if media_type.downcase == 'multipart/form-data'
          boundary = rand_string(20)
          # Assign a new string instead of appending in place, so neither the
          # string obtained from the form node nor an older boundary lives on.
          @enctype = "#{media_type}; boundary=#{boundary}"

          parts = []
          query_params.each { |k, v| parts << param_to_multipart(k, v) }
          @file_uploads.each { |f| parts << file_to_multipart(f) }

          parts.collect { |part| "--#{boundary}\r\n#{part}" }.join('') +
            "--#{boundary}--\r\n"
        else
          WWW::Mechanize.build_query_string(query_params)
        end
      end

      # Short human readable summary: name, method and action of the form.
      def inspect
        "Form: ['#{@name}' #{@method} #{@action}]"
      end

      private

      # Walks all nodes below elements_node and sorts the form controls into
      # the fields, buttons, file_uploads, radiobuttons and checkboxes lists.
      def parse
        @fields       = WWW::Mechanize::List.new
        @buttons      = WWW::Mechanize::List.new
        @file_uploads = WWW::Mechanize::List.new
        @radiobuttons = WWW::Mechanize::List.new
        @checkboxes   = WWW::Mechanize::List.new

        @elements_node.each_recursive do |node|
          attrs = node.attributes
          name = attrs['name']
          # A missing type attribute is treated as 'text'.
          type = (attrs['type'] || 'text').downcase

          # Don't add fields that don't have a name (submit buttons excepted)
          next if type != 'submit' && name.nil?

          case node.name.downcase
          when 'input'
            case type
            when 'text', 'password', 'hidden', 'int'
              @fields << Field.new(name, attrs['value'] || '')
            when 'radio'
              @radiobuttons << RadioButton.new(name, attrs['value'], attrs.has_key?('checked'))
            when 'checkbox'
              @checkboxes << CheckBox.new(name, attrs['value'], attrs.has_key?('checked'))
            when 'file'
              @file_uploads << FileUpload.new(name, attrs['value'])
            when 'submit'
              @buttons << Button.new(name, attrs['value'])
            when 'image'
              @buttons << ImageButton.new(name, attrs['value'])
            end
          when 'textarea'
            @fields << Field.new(name, node.all_text)
          when 'select'
            if attrs.has_key?('multiple')
              @fields << MultiSelectList.new(name, node)
            else
              @fields << SelectList.new(name, node)
            end
          end
        end
      end

      # Returns a random string of +len+ ASCII letters (a-z, A-Z).
      def rand_string(len = 10)
        chars = ("a".."z").to_a + ("A".."Z").to_a
        string = ""
        # rand(n) yields 0...n, so pass the full size; passing size - 1 would
        # make the last letter unreachable.
        len.times { string << chars[rand(chars.size)] }
        string
      end

      # Backslash-escapes double quotes, carriage returns and backslashes so
      # that +str+ can be placed inside a quoted MIME header parameter.
      def mime_value_quote(str)
        str.gsub(/(["\r\\])/) { |s| '\\' + s }
      end

      # Builds one multipart body part (without the boundary line) for a
      # plain name/value pair.
      def param_to_multipart(name, value)
        "Content-Disposition: form-data; name=\"#{mime_value_quote(name)}\"\r\n" +
          "\r\n#{value}\r\n"
      end

      # Builds one multipart body part (without the boundary line) for a file
      # upload. A Content-Type header is only emitted if the upload has a
      # mime type.
      def file_to_multipart(file)
        body = "Content-Disposition: form-data; name=\"" +
               "#{mime_value_quote(file.name)}\"; " +
               "filename=\"#{mime_value_quote(file.file_name || '')}\"\r\n" +
               "Content-Transfer-Encoding: binary\r\n"

        body << "Content-Type: #{file.mime_type}\r\n" unless file.mime_type.nil?
        body << "\r\n#{file.file_data}\r\n"
        body
      end
    end

    # =Synopsis
    # This class encapsulates a form parsed out of an HTML page. Each type
    # of input fields available in a form can be accessed through this object.
    # See GlobalForm for more methods.
    #
    # ==Example
    # Find a form and print out its fields
    #  form = page.forms.first # => WWW::Mechanize::Form
    #  form.fields.each { |f| puts f.name }
    class Form < GlobalForm
      attr_reader :node

      # +node+ is used both as the form node and as the node below which the
      # form elements are searched.
      def initialize(node)
        @node = node
        super(@node, @node)
      end

      # Fetch the first field whose name is equal to field_name.
      # Returns nil if there is no such field.
      def field(field_name)
        fields.find { |f| f.name.eql? field_name }
      end

      # This method sets multiple fields on the form. It takes a list of field
      # name, value pairs. If there is more than one field found with the
      # same name, this method will set the first one found. If you want to
      # set the value of a duplicate field, use a value which is an Array with
      # the second value of the array as the index in to the form. The index
      # is zero based. For example, to set the second field named 'foo', you
      # could do the following:
      #  form.set_fields( :foo => ['bar', 1] )
      #
      # A plain (non-Array) value sets the first field of that name:
      #  form.set_fields( :foo => 'bar' )
      def set_fields(fields = {})
        fields.each do |k, v|
          # Wrap plain values so that Strings are never iterated (String has
          # no #each on Ruby >= 1.9, and iterates lines on 1.8).
          value, index = v.is_a?(Array) ? v : [v]

          # A missing index is nil, and nil.to_i is 0: the first field.
          self.fields.name(k.to_s)[index.to_i].value = value
        end
      end

      # Treat form fields like accessors: +form.foo+ returns the value of the
      # first field named 'foo', +form.foo = x+ (or +form.foo(x)+) sets it.
      # Anything that does not name a field is handed on to super.
      def method_missing(id, *args)
        target = field(id.to_s.sub(/=\z/, ''))
        return super unless target

        return target.value if args.empty?
        target.value = args[0]
      end

      # Keeps respond_to? in agreement with method_missing: the form responds
      # to the name of every field it contains (with or without trailing '=').
      def respond_to_missing?(id, include_private = false)
        !field(id.to_s.sub(/=\z/, '')).nil? || super
      end
    end
  end
end