Sha256: 6b42aeb452e7ca793f68811c605c69bfad700fa468f82566ff111013aadfb2f0
Contents?: true
Size: 1.72 KB
Versions: 2
Compression:
Stored size: 1.72 KB
Contents
require File.join(File.expand_path(File.dirname(__FILE__)), '../..', 'test_helper.rb') require 'rbbt/text/document' require 'rbbt/text/corpus/sources/pmid' class TestDocument < Test::Unit::TestCase def setup Log.severity = 0 Document.corpus = Corpus.new Rbbt.tmp.test.document_corpus Corpus::Document.define :words do words = self.text.split(" ") Segment.align(self.text, words) end Corpus::Document.define :genes do require 'rbbt/ner/banner' Banner.new.match(self.text) end Corpus::Document.persist_in_global_tsv("genes") Corpus::Document.persist_in_global_tsv(:words) end def test_title_and_text document = Document.setup('PMID:32272262') assert document.text.downcase.include?("covid") assert_equal "High-resolution Chest CT Features and Clinical Characteristics of Patients Infected with COVID-19 in Jiangsu, China.", document.title end def test_full_text document = Document.setup('PMID:4304705') assert document.text.length < document.full_text.length end def test_words document = Document.setup('PMID:32272262') words = document.entities :words assert words.first.respond_to?(:offset) end def test_genes text = "This is a mention to TP53, a gene that should be found" document = Document.setup(Document.corpus.add_document(text, "TEST")) genes = document.entities :genes assert_equal "TP53", genes.first assert genes.first.respond_to?(:offset) text = "This is a mention to TP53, a gene that should be found" document = Document.setup(Document.corpus.add_document(text, "TEST")) genes = document.entities :genes assert_equal "TP53", genes.first assert genes.first.respond_to?(:offset) end end
Version data entries
2 entries across 2 versions & 1 rubygems
Version | Path |
---|---|
rbbt-text-1.2.0 | test/rbbt/text/test_document.rb |
rbbt-text-1.1.9 | test/rbbt/text/test_document.rb |