Sha256: 6ef9f07e5d754bdf5148f8150479cd148472d8bb5c72e38256bad41b04298baf

Contents?: true

Size: 859 Bytes

Versions: 2

Compression:

Stored size: 859 Bytes

Contents

require File.join(File.expand_path(File.dirname(__FILE__)), '../../../..', 'test_helper.rb')
require 'rbbt/text/document'
require 'rbbt/text/corpus'
require 'rbbt/text/corpus/sources/pmid'

# Test case for the PubMed source of the document corpus: +setup+ wires up a
# corpus and two document annotations, and +test_query+ adds the results of a
# PubMed query to that corpus and reads each document's text back.
class TestCorpusPMID < Test::Unit::TestCase
  # Assigns a corpus located at Rbbt.tmp.test.document_corpus to Document and
  # registers the :words and :genes definitions on Corpus::Document, then
  # marks both for persistence through persist_in_global_tsv.
  def setup
    # NOTE(review): 0 is presumably the most verbose log level -- confirm.
    Log.severity = 0
    Document.corpus = Corpus.new(Rbbt.tmp.test.document_corpus)

    # :words -- the text split on " ", handed to Segment.align together with
    # the text itself.
    Corpus::Document.define(:words) do
      tokens = self.text.split(" ")
      Segment.align(self.text, tokens)
    end

    # :genes -- whatever Banner#match returns for the text. The banner library
    # is required inside the block, so it is only loaded when the block runs.
    Corpus::Document.define(:genes) do
      require 'rbbt/ner/banner'
      Banner.new.match(self.text)
    end

    Corpus::Document.persist_in_global_tsv("genes")
    Corpus::Document.persist_in_global_tsv(:words)
  end

  # Adds the documents of the "SARS-Cov-2" PubMed query to the corpus and
  # passes the text of every returned docid to +iif+. Makes no assertions; it
  # only fails if one of these calls raises.
  def test_query
    added_docids = Document.corpus.add_pubmed_query("SARS-Cov-2", 2000, :abstract)

    added_docids.each { |id| iif(Document.corpus.docid(id).text) }
  end
end

Version data entries

2 entries across 2 versions & 1 rubygem

Version Path
rbbt-text-1.2.0 test/rbbt/text/corpus/sources/test_pmid.rb
rbbt-text-1.1.9 test/rbbt/text/corpus/sources/test_pmid.rb