Sha256: 13c0d54a30e9692d070e40563d7b1d2b6360e2e8874ddd11d1e2ddc5214fe0db

Contents?: true

Size: 765 Bytes

Versions: 13

Compression:

Stored size: 765 Bytes

Contents

require 'rbbt/sources/pubmed'

# PubMed source support for Corpus: registers the :pubmed namespace and
# provides helpers that load PubMed articles as corpus documents.
class Corpus

  # Namespace registry; created here only if no NAMESPACES constant is
  # already visible. Maps the :pubmed namespace to the name of the method
  # that loads it.
  NAMESPACES = {} unless defined? NAMESPACES
  NAMESPACES[:pubmed] = :add_pmid

  # Adds one or more PubMed articles to the corpus through add_document.
  #
  # pmid - a single identifier or an Array of identifiers; a non-Array value
  #        is wrapped in a one-element Array.
  # type - which text to store. nil (or an empty String) means "full text
  #        when the article has a pdf_url, abstract otherwise". A value whose
  #        to_sym is :abstract forces the abstract. Any other value requests
  #        the full text.
  #
  # Returns an Array with the result of add_document for each entry yielded
  # by PubMed.get_article (iterated here as identifier/article pairs).
  # Raises RuntimeError when full text is requested for an article whose
  # pdf_url is nil.
  def add_pmid(pmid, type = nil)
    id_list = pmid.is_a?(Array) ? pmid : [pmid]
    type = nil if type.is_a?(String) && type.empty?

    PubMed.get_article(id_list).map do |article_id, article|
      # Without an explicit type, fall back to the abstract only when there
      # is no PDF; with an explicit type, only :abstract selects the abstract.
      use_abstract =
        if type.nil?
          article.pdf_url.nil?
        else
          type.to_sym == :abstract
        end

      next add_document(article.text, :pubmed, article_id, :abstract) if use_abstract

      raise "No FullText available for #{ article_id }" if article.pdf_url.nil?

      add_document(article.full_text, :pubmed, article_id, :fulltext)
    end
  end

  # Runs a PubMed query limited to max results and adds every identifier it
  # returns via add_pmid, forwarding type unchanged.
  #
  # Returns whatever add_pmid returns for the resulting identifiers.
  def add_pubmed_query(query, max, type = nil)
    add_pmid(PubMed.query(query, max), type)
  end
end

Version data entries

13 entries across 13 versions & 1 rubygems

Version Path
rbbt-text-1.1.7 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.6 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.5 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.4 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.3 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.2 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.1 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.1.0 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-1.0.0 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-0.6.3 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-0.6.2 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-0.6.0 lib/rbbt/corpus/sources/pubmed.rb
rbbt-text-0.5.0 lib/rbbt/corpus/sources/pubmed.rb