Sha256: 600854cb8362497f22d92fc9d3fac6d2a6341320770548fbfea7bd13a2f91ed1

Contents?: true

Size: 1.6 KB

Versions: 62

Compression:

Stored size: 1.6 KB

Contents

# frozen_string_literal: true

module Onebox
  module Engine
    # Onebox engine for PubMed article URLs of the form
    # http(s)://[subdomain.]www.ncbi.nlm.nih.gov/pubmed/<pmid>.
    #
    # It downloads the "report=xml&format=text" view of the article and
    # exposes title, authors, journal, abstract, publication date, link and
    # PMID through #data.
    class PubmedOnebox
      include Engine
      include LayoutSupport

      # Dots in the host name are escaped so they only match a literal ".".
      matches_regexp Regexp.new("^https?://(?:(?:\\w)+\\.)?(www\\.ncbi\\.nlm\\.nih)\\.gov(?:/)?/pubmed/\\d+")

      private

      # Fetches the XML report for @url and returns it as a Nokogiri document.
      #
      # The response is parsed once to read the text of its <pre> element(s);
      # that text is then wrapped in a synthetic <root> element and parsed
      # again, so the article fields can be queried with CSS selectors.
      #
      # Uses URI#open (provided by open-uri) instead of Kernel#open, which no
      # longer accepts URIs on Ruby 3.0+. The block form closes the response
      # stream as soon as it has been parsed.
      def get_xml
        report_url = URI.join(@url, "?report=xml&format=text")
        doc = report_url.open { |io| Nokogiri::XML(io) }
        Nokogiri::XML("<root>" + doc.xpath("//pre").text + "</root>")
      end

      # Builds a human readable author list such as "A Smith, B Jones and C Doe".
      #
      # Initials and last name are read per <Author> element so that an author
      # lacking one of the two cannot shift the pairing of the other authors,
      # and so that names outside of <Author> elements are not picked up.
      # Authors with neither initials nor last name are skipped.
      #
      # @param xml [#css] parsed article document
      # @return [String] formatted author list, "" when there are no authors
      def authors_of_xml(xml)
        names = xml.css("Author").map do |author|
          [author.css("Initials").text, author.css("LastName").text].reject(&:empty?).join(" ")
        end
        names = names.reject(&:empty?)

        *leading, last = names
        return last.to_s if leading.empty?

        "#{leading.join(", ")} and #{last}"
      end

      # Formats the first <PubDate> element as "Month Day Year" (or
      # "Season Year"), leaving out the parts that are absent.
      #
      # The parts are looked up by element name rather than by sorting the
      # text tokens, so a day or a numeric month cannot end up in the wrong
      # position. When none of those parts is present the text of
      # <MedlineDate> is returned unchanged.
      #
      # @param xml [#css] parsed article document
      # @return [String] formatted date, "" when no date is available
      def date_of_xml(xml)
        pub_date = xml.css("PubDate").first
        return "" unless pub_date

        fields = pub_date.element_children.each_with_object({}) do |node, found|
          value = node.content.strip
          found[node.name] ||= value unless value.empty?
        end

        parts = [fields["Month"] || fields["Season"], fields["Day"], fields["Year"]].compact
        return parts.join(" ") unless parts.empty?

        fields.fetch("MedlineDate", "")
      end

      # Collects the values handed to the layout template.
      #
      # @return [Hash] with keys :title, :authors, :journal, :abstract,
      #   :date, :link and :pmid
      def data
        xml = get_xml
        {
          title: xml.css("ArticleTitle").text,
          authors: authors_of_xml(xml),
          journal: xml.css("Title").text,
          # An abstract may be split over several <AbstractText> elements;
          # join them with a space so the sections do not run together.
          abstract: xml.css("AbstractText").map(&:text).join(" "),
          date: date_of_xml(xml),
          link: @url,
          pmid: match[:pmid]
        }
      end

      # Memoized match of @url exposing the numeric article id as :pmid.
      # Accepts the same optional extra slash before "pubmed" as the
      # matches_regexp pattern above.
      #
      # @return [MatchData, nil]
      def match
        @match ||= @url.match(%r{www\.ncbi\.nlm\.nih\.gov//?pubmed/(?<pmid>[0-9]+)})
      end
    end
  end
end

Version data entries

62 entries across 62 versions & 1 rubygems

Version Path
onebox-2.2.2 lib/onebox/engine/pubmed_onebox.rb
onebox-2.2.1 lib/onebox/engine/pubmed_onebox.rb
onebox-2.2.0 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.9 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.8 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.7 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.6 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.5 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.4 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.3 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.2 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.1 lib/onebox/engine/pubmed_onebox.rb
onebox-2.1.0 lib/onebox/engine/pubmed_onebox.rb
onebox-2.0.2 lib/onebox/engine/pubmed_onebox.rb
onebox-2.0.1 lib/onebox/engine/pubmed_onebox.rb
onebox-2.0.0 lib/onebox/engine/pubmed_onebox.rb
onebox-1.9.30 lib/onebox/engine/pubmed_onebox.rb
onebox-1.9.29 lib/onebox/engine/pubmed_onebox.rb
onebox-1.9.28.4 lib/onebox/engine/pubmed_onebox.rb
onebox-1.9.28.3 lib/onebox/engine/pubmed_onebox.rb