Sha256: 81f7591affd3c0fc5149d8da943a8caa80b3a73ea793c69fe5009d35d9a8e487

Contents?: true

Size: 1.35 KB

Versions: 7

Compression:

Stored size: 1.35 KB

Contents

require File.join(File.expand_path(File.dirname(__FILE__)), '../../..', 'test_helper.rb')
require 'rbbt/nlp/genia/sentence_splitter'

# Exercises NLP.geniass_sentence_splitter and
# NLP.geniass_sentence_splitter_extension on short multi-line inputs in which
# one sentence is broken across two lines.
class TestNLP < Test::Unit::TestCase
  # The element at index 2 of the splitter output should be the sentence that
  # spans a line break, even when an earlier sentence holds a non-ASCII
  # character.
  def test_sentences
    input = <<-EOF
This is a sentence.    
A funky character ™ in a sentence.
This is a sentence.    
This is a broken
sentence. This is
another broken sentence. 
    EOF

    sentences = NLP.geniass_sentence_splitter(input)

    assert_equal "This is a broken\nsentence.", sentences[2].strip
  end

  # Same check as above on plain ASCII input.
  def test_sentences_2
    sentences = NLP.geniass_sentence_splitter(plain_broken_text)

    assert_equal "This is a broken\nsentence.", sentences[2].strip
  end

  # Same check against the extension variant of the splitter, executed inside
  # Log.with_severity 0 (presumably the most verbose level -- confirm against
  # the Log implementation).
  def test_sentences_ext
    input = plain_broken_text

    Log.with_severity 0 do
      sentences = NLP.geniass_sentence_splitter_extension(input)

      assert_equal "This is a broken\nsentence.", sentences[2].strip
    end
  end

  # Runs the splitter on a sentence containing brackets, percentages and
  # decimal numbers. NOTE(review): there is no assertion here; the result is
  # only handed to `iii`, which looks like a project debug-print helper --
  # confirm, and consider pinning the expected output.
  def test_sentence_cmi
    input = <<-EOF
The COVID-19 infection was reported as the main cause of death and patients with a higher mortality risk were those aged ≥65 years [adjusted HR = 3.40 (95% CI 2.20-5.24)], with a higher disease severity [adjusted HR = 1.87 (95%CI 1.43-2.45)].
    EOF

    iii NLP.geniass_sentence_splitter(input)
  end

  private

  # Builds the ASCII-only fixture shared by the plain and extension tests.
  # A new String is returned on every call so tests never share an instance.
  def plain_broken_text
    <<-EOF
This is a sentence.    
This is a sentence.    
This is a broken
sentence. This is
another broken sentence. 
    EOF
  end
end

Version data entries

7 entries across 7 versions & 1 rubygem

Version Path
rbbt-text-1.5.2 test/rbbt/nlp/genia/test_sentence_splitter.rb
rbbt-text-1.5.1 test/rbbt/nlp/genia/test_sentence_splitter.rb
rbbt-text-1.5.0 test/rbbt/nlp/genia/test_sentence_splitter.rb
rbbt-text-1.4.0 test/rbbt/nlp/genia/test_sentence_splitter.rb
rbbt-text-1.3.11 test/rbbt/nlp/genia/test_sentence_splitter.rb
rbbt-text-1.3.10 test/rbbt/nlp/genia/test_sentence_splitter.rb
rbbt-text-1.3.9 test/rbbt/nlp/genia/test_sentence_splitter.rb