Sha256: 88747ad672d2de2ce2cc5ab9a891ba58417e16912ae7d17a12ed4897548100f0
Contents?: true
Size: 1.95 KB
Versions: 3
Compression:
Stored size: 1.95 KB
Contents
require "test/unit" require "shoulda" require "webmock/test_unit" require "yaml" require "lib/jkl" class TextCleaningTest < Test::Unit::TestCase context "Cleaning Text" do should "Remove short lines" do input = <<-HTML the cat sat on the mat a short line HTML result = Jkl::Text::remove_short_lines input assert result == "the cat sat on the mat" end should "Remove shorter lines" do input = <<-HTML the cat sat on the mat the cat sat on the slightly fluffy, yet worn and homely mat a short line HTML result = Jkl::Text::remove_short_lines(input, 8) assert result == "the cat sat on the slightly fluffy, yet worn and homely mat" end should "Remove script tags" do input = <<-HTML the cat sat on the mat <script type="text/javascript" charset="utf-8"> function nofunction(){var bob;} </script> a short line HTML result = Jkl::Text::remove_short_lines input assert result == "the cat sat on the mat" end should "Remove html comments" do input = <<-HTML the cat sat on the mat <!-- a comment--> a short line HTML result = Jkl::Text::remove_short_lines input assert result == "the cat sat on the mat" end should "Remove blank lines" do input = <<-HTML the cat sat on the mat a short line HTML result = Jkl::Text::remove_short_lines input assert result == "the cat sat on the mat" end should "Strip all tags" do input = <<-HTML <p>the cat sat on the mat</p> HTML result = Jkl::Text::strip_all_tags input assert result == "the cat sat on the mat\n" #TODO fix carriage return end should "Clean text" do input = <<-HTML the cat sat on the mat <script type="text/javascript" charset="utf-8"> function nofunction(){var bob;} </script> <p> some para stuff here </p> some end stuff here HTML result = Jkl::Text::clean input assert result == "the cat sat on the mat" end end end
Version data entries
3 entries across 3 versions & 1 rubygems
Version | Path |
---|---|
jakal-0.1.95 | test/unit/text_cleaning_test.rb |
jakal-0.1.94 | test/unit/text_cleaning_test.rb |
jakal-0.1.93 | test/unit/text_cleaning_test.rb |