Sha256: e4e27e12377ab41f54ee7e3854118e2d32f4ebb2038a426e50e79f9aeb1bf128
Contents?: true
Size: 1.62 KB
Versions: 1
Compression:
Stored size: 1.62 KB
Contents
require 'open-nlp/base'

# Ruby-side wrapper classes layered on OpenNLP::Base. Each wrapper talks to
# its underlying object through @proxy_inst. Several methods are defined
# differently (or not at all) depending on whether RUBY_PLATFORM matches
# /java/, i.e. whether the code runs under JRuby.

# No Ruby-side overrides; everything is inherited from OpenNLP::Base.
class OpenNLP::SentenceDetectorME < OpenNLP::Base; end

# No Ruby-side overrides; everything is inherited from OpenNLP::Base.
class OpenNLP::SimpleTokenizer < OpenNLP::Base; end

# No Ruby-side overrides; everything is inherited from OpenNLP::Base.
class OpenNLP::TokenizerME < OpenNLP::Base; end

class OpenNLP::POSTaggerME < OpenNLP::Base

  # Only defined when NOT running under JRuby.
  unless RUBY_PLATFORM =~ /java/
    # Invokes the proxied object's "tag" method with an explicit JVM
    # signature ("[Ljava.lang.String;" is the descriptor for String[]).
    #
    # Only the first positional argument is forwarded; any further
    # arguments are ignored.
    def tag(*args)
      @proxy_inst._invoke("tag", "[Ljava.lang.String;", args[0])
    end
  end

end

class OpenNLP::ChunkerME < OpenNLP::Base

  if RUBY_PLATFORM =~ /java/

    # JRuby variant: converts both arguments to Java String arrays, calls
    # the proxied object's `chunk`, and returns the result as a Ruby Array.
    #
    # tokens - Array (or any object responding to #to_a) of token strings.
    # tags   - Array (or any object responding to #to_a) of tag strings.
    def chunk(tokens, tags)
      # Normalise each argument on its own. Previously `tags` was only
      # normalised when `tokens` was not an Array, so an Array of tokens
      # paired with a non-Array `tags` skipped the conversion. Array#to_a
      # returns the receiver itself, so Array inputs are unaffected.
      tokens = tokens.to_a unless tokens.is_a?(Array)
      tags   = tags.to_a   unless tags.is_a?(Array)

      java_tokens = tokens.to_java(:String)
      java_tags   = tags.to_java(:String)

      @proxy_inst.chunk(java_tokens, java_tags).to_a
    end

  else

    # Non-JRuby variant: invokes "chunk" with an explicit JVM signature for
    # two String[] parameters and returns each resulting element converted
    # with #to_s.
    def chunk(tokens, tags)
      chunks = @proxy_inst._invoke(
        "chunk",
        "[Ljava.lang.String;[Ljava.lang.String;",
        tokens, tags
      )
      chunks.map { |c| c.to_s }
    end

  end

end

class OpenNLP::Parser < OpenNLP::Base

  # Parses +text+ and returns whatever the proxied object's `parse` returns.
  #
  # Steps, as performed below:
  # 1. Build a Parse of type "INC" whose span covers 0...text.size.
  # 2. Obtain token spans from a freshly constructed OpenNLP::TokenizerME
  #    via #tokenize_pos.
  # 3. Insert one Parse of type "TK" per token span, using the token's
  #    position in the list as the final constructor argument.
  # 4. Pass the assembled Parse to @proxy_inst.parse.
  #
  # NOTE(review): the numeric constructor arguments (1, 0 / 0, i) are
  # presumably probability and index per the OpenNLP Parse constructor;
  # confirm against the Javadoc.
  def parse(text)
    tokenizer = OpenNLP::TokenizerME.new

    full_span = OpenNLP::Bindings::Span.new(0, text.size)
    parse_obj = OpenNLP::Bindings::Parse.new(text, full_span, "INC", 1, 0)

    tokenizer.tokenize_pos(text).each_with_index do |tok, i|
      # The original also sliced the token text out of +text+ here but
      # never used it; that dead local has been removed.
      span = OpenNLP::Bindings::Span.new(tok.get_start, tok.get_end)
      parse_obj.insert(OpenNLP::Bindings::Parse.new(text, span, "TK", 0, i))
    end

    @proxy_inst.parse(parse_obj)
  end

end

class OpenNLP::NameFinderME < OpenNLP::Base

  # Only defined when NOT running under JRuby.
  unless RUBY_PLATFORM =~ /java/
    # Invokes the proxied object's "find" method with an explicit JVM
    # signature ("[Ljava.lang.String;" is the descriptor for String[]).
    #
    # Only the first positional argument is forwarded; any further
    # arguments are ignored.
    def find(*args)
      @proxy_inst._invoke("find", "[Ljava.lang.String;", args[0])
    end
  end

end
Version data entries
1 entries across 1 versions & 1 rubygems
Version | Path |
---|---|
open-nlp-0.1.5 | lib/open-nlp/classes.rb |