Sha256: c4259498befa83deb4f9a55a33ae6dd43e92333a476944e74170548cfb3c9305
Contents?: true
Size: 1.97 KB
Versions: 5
Compression:
Stored size: 1.97 KB
Contents
/**
 * Copyright © 2010-2012 Atilika Inc. All rights reserved.
 *
 * See the NOTICE.txt file distributed with this work for additional
 * information regarding copyright ownership.
 *
 * Atilika Inc. licenses this file to you under the Apache License, Version
 * 2.0 (the "License"); you may not use this file except in compliance with
 * the License. A copy of the License is distributed with this work in the
 * LICENSE.txt file. You may also obtain a copy of the License from
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
 * License for the specific language governing permissions and limitations
 * under the License.
 */
package org.atilika.kuromoji.example;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.util.List;

import org.atilika.kuromoji.Token;
import org.atilika.kuromoji.Tokenizer;
import org.atilika.kuromoji.Tokenizer.Mode;

/**
 * Interactive command-line example: reads lines from standard input,
 * tokenizes each one and prints every token's surface form and features
 * separated by a tab.
 *
 * <p>Command-line arguments:
 * <ul>
 *   <li>none - a tokenizer with the builder's default settings is used;</li>
 *   <li>one - the argument is upper-cased and resolved to a {@link Mode};</li>
 *   <li>two - the first is resolved to a {@link Mode} and the second is handed
 *       to the builder's {@code userDictionary} method (presumably a path to
 *       a user dictionary file - confirm against the Tokenizer API);</li>
 *   <li>any other count - all arguments are ignored and the default
 *       tokenizer is used.</li>
 * </ul>
 */
public class TokenizerExample {

    /**
     * Entry point: builds the tokenizer, prints a readiness prompt, then
     * tokenizes standard input line by line until end of input.
     *
     * @param args optional mode name and user dictionary argument, see the
     *             class description
     * @throws IOException if reading standard input fails, or if it is raised
     *                     while the tokenizer is being built
     */
    public static void main(String[] args) throws IOException {
        Tokenizer tokenizer = createTokenizer(args);
        System.out.println("Tokenizer ready. Provide input text and press RET.");

        BufferedReader stdin = new BufferedReader(new InputStreamReader(System.in));
        for (String text = stdin.readLine(); text != null; text = stdin.readLine()) {
            List<Token> tokens = tokenizer.tokenize(text);
            for (Token token : tokens) {
                System.out.println(token.getSurfaceForm() + "\t" + token.getAllFeatures());
            }
        }
    }

    /**
     * Builds the tokenizer selected by the number of command-line arguments.
     *
     * @param args the command-line arguments passed to {@link #main(String[])}
     * @return the configured tokenizer
     * @throws IOException propagated from the builder calls
     */
    private static Tokenizer createTokenizer(String[] args) throws IOException {
        switch (args.length) {
            case 1: {
                Mode requested = parseMode(args[0]);
                return Tokenizer.builder().mode(requested).build();
            }
            case 2: {
                // Resolve the mode before touching the builder, as the inline version did.
                Mode requested = parseMode(args[0]);
                return Tokenizer.builder().mode(requested).userDictionary(args[1]).build();
            }
            default:
                // Zero arguments, or more than two: fall back to the builder defaults.
                return Tokenizer.builder().build();
        }
    }

    /**
     * Resolves a mode name to its {@link Mode} constant after upper-casing it.
     *
     * @param name the mode name as typed on the command line
     * @return the matching mode constant
     */
    private static Mode parseMode(String name) {
        return Mode.valueOf(name.toUpperCase());
    }
}
Version data entries
5 entries across 5 versions & 2 rubygems