Sha256: 85b6d2ff60eac7277805e0e4aa72e7fb64345e1e6dae9348295fce2b5e9a79f1
Contents?: true
Size: 862 Bytes
Versions: 27
Compression:
Stored size: 862 Bytes
Contents
# encoding: UTF-8

# Copyright 2012 Twitter, Inc
# http://www.apache.org/licenses/LICENSE-2.0

module TwitterCldr
  module Tokenizers
    # Tokenizes time format patterns by delegating to a PatternTokenizer
    # configured with a shared, lazily-built Tokenizer.
    class TimeTokenizer
      class << self
        # Returns the Tokenizer shared by every TimeTokenizer instance.
        #
        # The tokenizer is built on first use and memoized in a class-level
        # instance variable. It is constructed from two recognizers and a
        # second regex argument:
        #
        # * :pattern   - anchored match on a run of one of the field letters
        #                a, B, h, H, K, k, m, s, S, z, Z, V, v
        # * :plaintext - empty regex, i.e. matches anything not claimed above
        #
        # NOTE(review): the second argument is presumably the regex Tokenizer
        # uses to split the input (it additionally accepts single-quoted
        # literals) -- confirm against Tokenizer.
        def tokenizer
          @tokenizer ||= Tokenizer.new(
            [
              # The field alternatives must stay in sync with the second regex
              # below. `Z{1,4}` and `V{1,4}` are separate alternatives; without
              # the `|` between them a lone Z or V run would not be recognized
              # as :pattern and would fall through to :plaintext.
              TokenRecognizer.new(:pattern, /^(a{1}|B{1,5}|h{1,2}|H{1,2}|K{1,2}|k{1,2}|m{1,2}|s{1,2}|S+|z{1,4}|Z{1,4}|V{1,4}|v{1,4})/),
              TokenRecognizer.new(:plaintext, //)
            ],
            /(\'[\w\s-]+\'|a{1}|B{1,5}|h{1,2}|H{1,2}|K{1,2}|k{1,2}|m{1,2}|s{1,2}|S+|z{1,4}|Z{1,4}|V{1,4}|v{1,4})/
          )
        end
      end

      # The data reader handed to PatternTokenizer on every #tokenize call.
      attr_reader :data_reader

      # data_reader - object stored as-is and passed through to
      #               PatternTokenizer.
      def initialize(data_reader)
        @data_reader = data_reader
      end

      # Tokenizes +pattern+ with a new PatternTokenizer built from this
      # instance's data reader and the shared tokenizer.
      #
      # Returns whatever PatternTokenizer#tokenize returns.
      def tokenize(pattern)
        PatternTokenizer.new(data_reader, tokenizer).tokenize(pattern)
      end

      # Instance-level accessor for the class-level shared tokenizer.
      def tokenizer
        self.class.tokenizer
      end
    end
  end
end
Version data entries
27 entries across 27 versions & 1 rubygems