spec/break_iterator_spec.rb in ffi-icu-0.0.6 vs spec/break_iterator_spec.rb in ffi-icu-0.0.7
- old
+ new
@@ -16,10 +16,24 @@
iterator = BreakIterator.new :word, "en_US"
iterator.text = "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do eiusmod tempor incididunt ut labore et dolore magna aliqua."
iterator.to_a.should == [0, 5, 6, 11, 12, 17, 18, 21, 22, 26, 27, 28, 39, 40, 51, 52, 56, 57, 58, 61, 62, 64, 65, 72, 73, 79, 80, 90, 91, 93, 94, 100, 101, 103, 104, 110, 111, 116, 117, 123, 124]
end
- it "finds all word boundaries in a Thai string" do
+ it "returns each substring" do # checks BreakIterator#substrings in :word mode on a short English sentence
+ iterator = BreakIterator.new :word, "en_US"
+ iterator.text = "Lorem ipsum dolor sit amet."
+
+ iterator.substrings.should == ["Lorem", " ", "ipsum", " ", "dolor", " ", "sit", " ", "amet", "."] # each space and the final period are expected as separate elements, so the pieces concatenate back to the input
+ end
+
+ it "returns the substrings of a non-ASCII string" do # same check as the English example, but with multi-byte Thai text and the th_TH locale
+ iterator = BreakIterator.new :word, "th_TH"
+ iterator.text = "รู้อะไรไม่สู้รู้วิชา รู้รักษาตัวรอดเป็นยอดดี" # the text contains only a single space
+
+ iterator.substrings.should == ["รู้", "อะไร", "ไม่สู้", "รู้", "วิชา", " ", "รู้", "รักษา", "ตัว", "รอด", "เป็น", "ยอดดี"] # 12 segments expected, so the splitting cannot be whitespace-based; the lone space is its own element
+ end
+
+ it "finds all word boundaries in a non-ASCII string" do # checks the boundary offsets from #to_a for a short Thai string
iterator = BreakIterator.new :word, "th_TH"
iterator.text = "การทดลอง" # 8 Thai characters with no spaces
iterator.to_a.should == [0, 3, 8] # last offset equals the character count (8), not the UTF-8 byte length; NOTE(review): presumably offsets are character/UTF-16 indices, confirm against the library
end