Sha256: 336fbd5aabb2c90e8be8db5b3be056c438fa81a86cf0e79ec2a84801a6b25477
Contents?: true
Size: 1.74 KB
Versions: 2
Compression:
Stored size: 1.74 KB
Contents
require "json" require "rest_client" require "calais" module Jkl def self.get_from_calais(content) begin license_id = YAML::load_file('config/keys.yml')['calais'] c_uri = URI.parse('http://api.opencalais.com/enlighten/rest/') post_args = { 'licenseID' => license_id, 'content' => content, 'paramsXML' => paramsXML('application/json') } post_to(c_uri, post_args) rescue Exception => e puts e end end def self.get_tag_from_json(response) result = JSON.parse response result.delete_if {|key, value| key == "doc" } # ditching the doc cleaned_result = [] result.each do |key,tag| tag = Jkl::clean_unwanted_items_from_hash tag cleaned_result << tag yield tag if block_given? end cleaned_result end def self.get_calais_metadata(response) #ce = CalaisExtractor.new( response ) #ce.prettify #TODO work out how to implement this end #jkl doesn't work with these aspects of the calais response, also removing blanks def self.clean_unwanted_items_from_hash h h.delete_if {|k, v| k == "relevance" } h.delete_if {|k, v| k == "instances" } h.delete_if {|k, v| v == "N/A"} h.delete_if {|k, v| v == []} h.delete_if {|k, v| v == ""} h.delete_if {|k, v| k == "_typeGroup"} h end private def self.paramsXML(format) <<-paramsXML; <c:params xmlns:c="http://s.opencalais.com/1/pred/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"> <c:processingDirectives c:contentType="text/txt" c:outputFormat="#{format}"> </c:processingDirectives> <c:userDirectives /> <c:externalMetadata /> </c:params> paramsXML end end
Version data entries
2 entries across 2 versions & 1 rubygems
Version | Path |
---|---|
jakal-0.0.8 | lib/jkl/calais_client.rb |
jakal-0.0.7 | lib/jkl/calais_client.rb |