Sha256: 7fe84916bd29faf113313d302413b83e8b878f3543ed80d16f0804dcf0bfbc6f
Contents?: true
Size: 1.04 KB
Versions: 21
Compression:
Stored size: 1.04 KB
Contents
# -*- encoding : utf-8 -*- module PragmaticSegmenter # This class searches for periods within an abbreviation and # replaces the periods. class SingleLetterAbbreviation # Rubular: http://rubular.com/r/e3H6kwnr6H SingleUpperCaseLetterAtStartOfLineRule = Rule.new(/(?<=^[A-Z])\.(?=\s)/, '∯') # Rubular: http://rubular.com/r/gitvf0YWH4 SingleUpperCaseLetterRule = Rule.new(/(?<=\s[A-Z])\.(?=\s)/, '∯') attr_reader :text def initialize(text:) @text = text end def replace @formatted_text = replace_single_letter_abbreviations(text) end private def replace_single_letter_abbreviations(txt) new_text = replace_single_uppercase_letter_abbreviation_at_start_of_line(txt) replace_single_uppercase_letter_abbreviation(new_text) end def replace_single_uppercase_letter_abbreviation_at_start_of_line(txt) txt.apply(SingleUpperCaseLetterAtStartOfLineRule) end def replace_single_uppercase_letter_abbreviation(txt) txt.apply(SingleUpperCaseLetterRule) end end end
Version data entries
21 entries across 21 versions & 1 rubygems
Version | Path |
---|---|
pragmatic_segmenter-0.0.1 | lib/pragmatic_segmenter/single_letter_abbreviation.rb |