Sha256: f01f04c576f12fc94897bd06bdacbfea44402e7cd82236b1871a3e778346f31f
Contents?: true
Size: 1.86 KB
Versions: 1
Compression:
Stored size: 1.86 KB
Contents
require "json" require "rest_client" require "calais" module Jkl def self.get_from_calais(content) begin license_id = YAML::load_file('config/keys.yml')['calais'] c_uri = URI.parse('http://api.opencalais.com/enlighten/rest/') post_args = { 'licenseID' => license_id, 'content' => content, 'paramsXML' => paramsXML('application/json') } post_to(c_uri, post_args) rescue Exception => e puts e end end def self.get_tag_from_json(response) result = JSON.parse response result.delete_if {|key, value| key == "doc" } # ditching the doc cleaned_result = [] result.each do |key,tag| tag = Jkl::clean_unwanted_items_from_hash tag cleaned_result << tag yield tag if block_given? end cleaned_result end def self.get_calais_metadata(key, text) name_value_pairs = Jkl::tags(key, text).entities.map{|e| {e.type => [e.attributes["name"]]}} nested_list = {} name_value_pairs.each { |a| nested_list = nested_list.merge!(a){ |key,v1,v2| v1+v2 }} nested_list end #jkl doesn't work with these aspects of the calais response, also removing blanks def self.clean_unwanted_items_from_hash h h.delete_if {|k, v| k == "relevance" } h.delete_if {|k, v| k == "instances" } h.delete_if {|k, v| v == "N/A"} h.delete_if {|k, v| v == []} h.delete_if {|k, v| v == ""} h.delete_if {|k, v| k == "_typeGroup"} h end private def self.paramsXML(format) <<-paramsXML; <c:params xmlns:c="http://s.opencalais.com/1/pred/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"> <c:processingDirectives c:contentType="text/txt" c:outputFormat="#{format}"> </c:processingDirectives> <c:userDirectives /> <c:externalMetadata /> </c:params> paramsXML end end
Version data entries
1 entries across 1 versions & 1 rubygems
Version | Path |
---|---|
jakal-0.0.9 | lib/jkl/calais_client.rb |