Sha256: c7d3d575de7ef2c391273595c729787bdaa35275905592c2bdf1071b6641b293

Contents?: true

Size: 1.25 KB

Versions: 9

Compression:

Stored size: 1.25 KB

Contents

module PragmaticSegmenter
  module Languages
    module Russian
      include Languages::Common

      # Abbreviation tables for Russian.
      module Abbreviation
        # Known abbreviations, written without their trailing period.
        # A few entries deliberately mix Latin and Cyrillic look-alike
        # letters (e.g. the leading Latin "y" entries and "л.h"); keep them
        # exactly as listed.
        ABBREVIATIONS = Set.new(%w[
          y y.e а авт адм.-терр акад в вв вкз вост.-европ
          г гг гос гр д деп дисс дол долл ежедн
          ж жен з зап зап.-европ заруб и ин иностр инст
          к канд кв кг куб л л.h л.н м мин
          моск муж н нед о п пгт пер пп пр
          просп проф р руб с сек см спб стр т
          тел тов тт тыс у у.е ул ф ч
        ]).freeze

        # No prepositive abbreviations are registered for Russian.
        PREPOSITIVE_ABBREVIATIONS = [].freeze

        # No number abbreviations are registered for Russian.
        NUMBER_ABBREVIATIONS = [].freeze
      end

      # Russian variant of the abbreviation replacer. It subclasses the
      # AbbreviationReplacer resolved from the enclosing namespaces and
      # defines its own period-replacement rule.
      # NOTE(review): presumably this overrides a same-named hook in the
      # parent class - confirm against the base implementation.
      class AbbreviationReplacer < AbbreviationReplacer
        # No sentence-starter words are registered for Russian.
        SENTENCE_STARTERS = [].freeze

        private

        # Replaces the period directly following +abbr+ with the placeholder
        # character '∯' when the abbreviation is preceded by whitespace or
        # sits at the start of a line (which includes the start of the text).
        #
        # @param txt [String] text to modify; it is mutated in place
        # @param abbr [String] abbreviation text; surrounding whitespace is
        #   stripped before matching
        # @return [String] the same +txt+ object
        def replace_period_of_abbr(txt, abbr)
          # Escape the abbreviation so that characters such as the inner "."
          # of "у.е" are matched literally instead of as regex wildcards.
          escaped = Regexp.escape(abbr.strip)
          # `^` already matches at the very start of the string, so a
          # separate `\A` pass is unnecessary.
          txt.gsub!(/(?<=\s#{escaped}|^#{escaped})\./, '∯')
          txt
        end
      end
    end
  end
end

Version data entries

9 entries across 9 versions & 1 rubygems

Version Path
pragmatic_segmenter-0.3.17 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.16 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.15 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.14 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.13 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.12 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.10 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.9 lib/pragmatic_segmenter/languages/russian.rb
pragmatic_segmenter-0.3.8 lib/pragmatic_segmenter/languages/russian.rb