Sha256: eb52bf57c4fc9723e482d54a250e23dfbc31724bfe882a85a7d2b55baf0e8bf9
Contents?: true
Size: 809 Bytes
Versions: 3
Compression:
Stored size: 809 Bytes
Contents
module PragmaticSegmenter
  module Languages
    # Burmese-specific overrides: a Process subclass plus the sentence
    # boundary and punctuation classes it delegates to.
    class Burmese
      # Process variant whose two private hooks are wired to the Burmese
      # classes defined further down in this namespace.
      class Process < PragmaticSegmenter::Process
        private

        # Builds a Burmese SentenceBoundaryPunctuation for +txt+ and returns
        # the result of its #split.
        def sentence_boundary_punctuation(txt)
          splitter = PragmaticSegmenter::Languages::Burmese::SentenceBoundaryPunctuation.new(text: txt)
          splitter.split
        end

        # Returns the punctuation list exposed by Burmese::Punctuation#punct.
        def punctuation_array
          marks = PragmaticSegmenter::Languages::Burmese::Punctuation.new
          marks.punct
        end
      end

      # Splits text on the Burmese sentence-ending characters.
      class SentenceBoundaryPunctuation < PragmaticSegmenter::SentenceBoundaryPunctuation
        # First alternative: shortest run ending in one of "။", "၏", "!" or
        # "?". Second alternative: whatever remains up to end of line, which
        # may be an empty string.
        SENTENCE_BOUNDARY = /.*?[။၏!\?]|.*?$/

        # Returns every SENTENCE_BOUNDARY match found in +text+, in order.
        # NOTE(review): +text+ is presumably a reader supplied by the parent
        # class and populated from the +text:+ keyword - confirm there.
        def split
          text.scan(SENTENCE_BOUNDARY)
        end
      end

      # Holds the punctuation characters used for Burmese.
      class Punctuation < PragmaticSegmenter::Punctuation
        PUNCT = ['။', '၏', '?', '!']

        # Returns the PUNCT array itself (not a copy).
        def punct
          PUNCT
        end
      end
    end
  end
end
Version data entries
3 entries across 3 versions & 1 rubygems