Sha256: 8227027a35ba5c2d2afd4c3ac5f51cfe26a7677e3d0406ae270a98e6569240bf
Contents?: true
Size: 1.7 KB
Versions: 1
Compression:
Stored size: 1.7 KB
Contents
require File.join(File.expand_path(File.dirname(__FILE__)), '../../..', 'test_helper.rb')
require 'rbbt/text/corpus/document'

# Tests for Corpus::Document properties: a per-document property (:words)
# and a batch-computed property (:words2), both persisted in global TSV files.
class TestCorpusDocument < Test::Unit::TestCase
  # Registers the :words and :words2 properties on Corpus::Document and
  # configures their global TSV persistence before each test.
  def setup
    Log.severity = 0

    # :words -- split the document text on single spaces and align the
    # resulting tokens against the original text.
    Corpus::Document.define :words do
      words = self.text.split(" ")
      Segment.align(self.text, words)
    end

    # Create the directory that holds the persisted annotations. The two
    # persistence paths below must live under this same directory; they were
    # previously spelled "anotations" and so never matched it.
    Open.mkdir Rbbt.tmp.test.annotations.find
    Corpus::Document.persist_in_global_tsv(:words, Rbbt.tmp.test.annotations.words.find)

    # :words2 -- same computation as :words, but the block receives a list of
    # documents and returns one result per document.
    Corpus::Document.define_multiple :words2 do |documents|
      documents.map do |doc|
        words = doc.text.split(" ")
        Segment.align(doc.text, words)
      end
    end

    # NOTE(review): :words2 is persisted under a file named "counts" -- confirm
    # the name is intentional.
    Corpus::Document.persist_in_global_tsv(:words2, Rbbt.tmp.test.annotations.counts.find)
  end

  # The :words property, once sorted, must equal the space-separated tokens
  # of the document text.
  def test_words
    text = "This is a test document"
    document = Corpus::Document.new(Rbbt.tmp.test.persist, "TEST:test_doc", text)

    # NOTE(review): arguments are in (actual, expected) order; left as-is so the
    # comparison performed stays exactly the same -- consider swapping.
    assert_equal Segment.sort(document.words), text.split(" ")
  end

  # The :words2 property prepared for several documents at once must equal
  # the space-separated tokens of each document's text.
  def test_words_multiple
    document1 = Corpus::Document.new(Rbbt.tmp.test.persist, "TEST:test_doc:1", "This is a test document")
    document2 = Corpus::Document.new(Rbbt.tmp.test.persist, "TEST:test_doc2:2", "This is a another test document")

    docs = [document1, document2]
    Corpus::Document.prepare_multiple(docs, :words2)

    assert_equal document1.words2, document1.text.split(" ")
    assert_equal document2.words2, document2.text.split(" ")

    # Second pass over freshly built documents with the same ids and text.
    # There are no assertions here, so this only checks that the call does not
    # raise -- presumably exercising the already-persisted path; TODO confirm.
    document1 = Corpus::Document.new(Rbbt.tmp.test.persist, "TEST:test_doc:1", "This is a test document")
    document2 = Corpus::Document.new(Rbbt.tmp.test.persist, "TEST:test_doc2:2", "This is a another test document")

    docs = [document1, document2]
    Corpus::Document.prepare_multiple(docs, :words2)
  end
end
Version data entries
1 entry across 1 version & 1 rubygem
Version | Path |
---|---|
rbbt-text-1.1.9 | test/rbbt/text/corpus/test_document.rb |