Sha256: c41adecf74fdc0030a273f61a2537cbdf386946f5dc1f5ee445a7ad3f28c184c

Contents?: true

Size: 1.23 KB

Versions: 10

Compression:

Stored size: 1.23 KB

Contents

module PragmaticTokenizer
  module Languages
    # Language data for Catalan: abbreviations, stop words and contractions.
    #
    # Mixes in Languages::Common (defined elsewhere in the project) and
    # declares three frozen constants. ABBREVIATIONS and CONTRACTIONS are
    # intentionally empty here; only STOP_WORDS carries entries.
    module Catalan
      include Languages::Common

      # No Catalan-specific abbreviations are listed.
      ABBREVIATIONS = [].freeze

      # Catalan stop words, one row per initial letter, in the original order.
      # NOTE(review): "des de" and "per que" contain a space; presumably they
      # can only match if the consumer compares against multi-word tokens —
      # confirm against the tokenizer's stop-word filtering.
      STOP_WORDS = [
        "a", "abans", "algun", "alguna", "algunes", "alguns", "altre", "amb", "ambdós", "anar", "ans", "aquell", "aquelles", "aquells", "aquí",
        "bastant", "bé",
        "cada", "com", "consegueixo", "conseguim", "conseguir", "consigueix", "consigueixen", "consigueixes",
        "dalt", "de", "des de", "dins",
        "el", "elles", "ells", "els", "en", "ens", "entre", "era", "erem", "eren", "eres", "es", "és", "éssent", "està", "estan", "estat", "estava", "estem", "esteu", "estic", "ets",
        "fa", "faig", "fan", "fas", "fem", "fer", "feu", "fi",
        "haver",
        "i", "inclòs",
        "jo",
        "la", "les", "llarg", "llavors",
        "mentre", "meu", "mode", "molt", "molts",
        "nosaltres",
        "o", "on",
        "per", "per que", "però", "perquè", "podem", "poden", "poder", "podeu", "potser", "primer", "puc",
        "quan", "quant", "qui",
        "sabem", "saben", "saber", "sabeu", "sap", "saps", "sense", "ser", "seu", "seus", "si", "soc", "solament", "sols", "som", "sota",
        "també", "te", "tene", "tenim", "tenir", "teniu", "teu", "tinc", "tot",
        "últim", "un", "una", "unes", "uns", "ús",
        "va", "vaig", "van", "vosaltres"
      ].freeze

      # No Catalan-specific contractions are listed.
      CONTRACTIONS = {}.freeze
    end
  end
end

Version data entries

10 entries across 10 versions and 1 rubygem

Version Path
pragmatic_tokenizer-1.4.0 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.3.1 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.3.0 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.2.0 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.1.2 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.1.1 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.1.0 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.0.2 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.0.1 lib/pragmatic_tokenizer/languages/catalan.rb
pragmatic_tokenizer-1.0.0 lib/pragmatic_tokenizer/languages/catalan.rb