spec/break_iterator_spec.rb in ffi-icu-0.0.6 vs spec/break_iterator_spec.rb in ffi-icu-0.0.7

- old
+ new

@@ -16,10 +16,24 @@
       iterator = BreakIterator.new :word, "en_US"
       iterator.text = "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua."
       iterator.to_a.should == [0, 5, 6, 11, 12, 17, 18, 21, 22, 26, 27, 28, 39, 40, 51, 52, 56, 57, 58, 61, 62, 64, 65, 72, 73, 79, 80, 90, 91, 93, 94, 100, 101, 103, 104, 110, 111, 116, 117, 123, 124]
     end
 
-    it "finds all word boundaries in a Thai string" do
+    it "returns each substring" do
+      iterator = BreakIterator.new :word, "en_US"
+      iterator.text = "Lorem ipsum dolor sit amet."
+
+      iterator.substrings.should == ["Lorem", " ", "ipsum", " ", "dolor", " ", "sit", " ", "amet", "."]
+    end
+
+    it "returns the substrings of a non-ASCII string" do
+      iterator = BreakIterator.new :word, "th_TH"
+      iterator.text = "รู้อะไรไม่สู้รู้วิชา รู้รักษาตัวรอดเป็นยอดดี"
+
+      iterator.substrings.should == ["รู้", "อะไร", "ไม่สู้", "รู้", "วิชา", " ", "รู้", "รักษา", "ตัว", "รอด", "เป็น", "ยอดดี"]
+    end
+
+    it "finds all word boundaries in a non-ASCII string" do
       iterator = BreakIterator.new :word, "th_TH"
       iterator.text = "การทดลอง"
       iterator.to_a.should == [0, 3, 8]
     end