Sha256: a538604320570e76b653accb9587b10ba526e33cc6758f0f9b8daacc7a07986e

Contents?: true

Size: 1.17 KB

Versions: 9

Compression:

Stored size: 1.17 KB

Contents

module PragmaticSegmenter
  module Languages
    module Bulgarian
      include Languages::Common

      # Abbreviation tables for the Bulgarian language module.
      module Abbreviation
        # Abbreviations stored without their trailing period. Entries may
        # still contain inner periods (e.g. "т.нар", "кв.м").
        ABBREVIATIONS = Set.new(
          %w[
            p.s акад ал б.р б.ред бел.а бел.пр бр бул в вж вкл вм вр г
            ген гр дж дм доц др ем заб зам инж к.с кв кв.м кг км
            кор куб куб.м л лв м м.г мин млн млрд мм н.с напр пл полк
            проф р рис с св сек см сп срв ст стр т т.г т.е т.н
            т.нар табл тел у ул фиг ха хил ч чл щ.д
          ]
        ).freeze

        # Both of the following lists are intentionally left empty here.
        NUMBER_ABBREVIATIONS = [].freeze
        PREPOSITIVE_ABBREVIATIONS = [].freeze
      end

      # Bulgarian variant of the abbreviation replacer. It subclasses the
      # AbbreviationReplacer constant resolved from an enclosing scope
      # (defined outside this file) and overrides how the period following
      # an abbreviation is rewritten.
      class AbbreviationReplacer < AbbreviationReplacer
        # No sentence starters are defined in this file for Bulgarian.
        SENTENCE_STARTERS = [].freeze

        private

        # Replaces the period directly following +abbr+ with '∯' whenever the
        # abbreviation is preceded by whitespace or sits at the start of a line.
        #
        # @param txt [String] text to process; it is modified in place
        # @param abbr [String] abbreviation text; surrounding whitespace is
        #   stripped before matching
        # @return [String] the same +txt+ object (never nil, even when no
        #   replacement was made)
        def replace_period_of_abbr(txt, abbr)
          # Escape the abbreviation so the periods inside entries such as
          # "т.нар" or "p.s" match literally instead of acting as regex
          # wildcards (unescaped, "p.s" would also match "pas").
          escaped = Regexp.escape(abbr.strip)
          txt.gsub!(/(?<=\s#{escaped})\.|(?<=^#{escaped})\./, '∯')
          # gsub! returns nil when nothing matched, so return txt explicitly.
          txt
        end
      end
    end
  end
end

Version data entries

9 entries across 9 versions & 1 rubygem

Version Path
pragmatic_segmenter-0.3.17 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.16 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.15 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.14 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.13 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.12 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.10 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.9 lib/pragmatic_segmenter/languages/bulgarian.rb
pragmatic_segmenter-0.3.8 lib/pragmatic_segmenter/languages/bulgarian.rb