Sha256: c4259498befa83deb4f9a55a33ae6dd43e92333a476944e74170548cfb3c9305

Contents?: true

Size: 1.97 KB

Versions: 5

Compression:

Stored size: 1.97 KB

Contents

/**
 * Copyright © 2010-2012 Atilika Inc.  All rights reserved.
 *
 * See the NOTICE.txt file distributed with this work for additional
 * information regarding copyright ownership.
 * 
 * Atilika Inc. licenses this file to you under the Apache License, Version
 * 2.0 (the "License"); you may not use this file except in compliance with
 * the License.  A copy of the License is distributed with this work in the
 * LICENSE.txt file.  You may also obtain a copy of the License from
 * 
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.  See the
 * License for the specific language governing permissions and limitations
 * under the License.
 */
package org.atilika.kuromoji.example;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.util.List;
import java.util.Locale;

import org.atilika.kuromoji.Token;
import org.atilika.kuromoji.Tokenizer;
import org.atilika.kuromoji.Tokenizer.Mode;

/**
 * Interactive command-line example: builds a {@link Tokenizer} from the
 * command-line arguments, then reads lines from standard input and prints
 * the tokens of each line to standard output.
 */
public class TokenizerExample {

	/**
	 * Reads standard input line by line until end of input and, for every
	 * token of every line, prints the token's surface form, a tab and the
	 * token's features.
	 *
	 * @param args no arguments for a default tokenizer; one argument to
	 *             select the {@link Mode} by name (case-insensitive); two
	 *             arguments to select the mode and pass the second argument
	 *             to the builder's {@code userDictionary(String)}
	 *             (presumably a user dictionary location - confirm against
	 *             the builder). Any other argument count falls back to the
	 *             default tokenizer.
	 * @throws IOException if reading standard input fails, or if building
	 *                     the tokenizer raises it
	 * @throws IllegalArgumentException if the mode name is rejected by
	 *                                  {@code Mode.valueOf}
	 */
	public static void main(String[] args) throws IOException {
		Tokenizer tokenizer = createTokenizer(args);
		System.out.println("Tokenizer ready.  Provide input text and press RET.");
		// Standard input is decoded with the platform default charset so the
		// example follows whatever encoding the user's console is set to.
		// The reader is deliberately not closed: it wraps System.in, which
		// this method does not own.
		BufferedReader reader = new BufferedReader(new InputStreamReader(System.in));
		String line;
		while ((line = reader.readLine()) != null) {
			List<Token> result = tokenizer.tokenize(line);
			for (Token token : result) {
				System.out.println(token.getSurfaceForm() + "\t"
						+ token.getAllFeatures());
			}
		}
	}

	/**
	 * Builds the tokenizer selected by the command-line arguments; see
	 * {@link #main(String[])} for how the arguments are interpreted.
	 */
	private static Tokenizer createTokenizer(String[] args) throws IOException {
		if (args.length == 1) {
			Mode mode = parseMode(args[0]);
			return Tokenizer.builder().mode(mode).build();
		}
		if (args.length == 2) {
			Mode mode = parseMode(args[0]);
			return Tokenizer.builder().mode(mode).userDictionary(args[1]).build();
		}
		return Tokenizer.builder().build();
	}

	/**
	 * Resolves a mode name to its {@link Mode} constant, ignoring case.
	 */
	private static Mode parseMode(String name) {
		// Locale.ROOT keeps the upper-casing independent of the JVM's default
		// locale; locale-specific case rules could otherwise produce a string
		// that does not match the constant's name.
		return Mode.valueOf(name.toUpperCase(Locale.ROOT));
	}
}

Version data entries

5 entries across 5 versions & 2 rubygems

Version Path
kuromoji-ruby-0.0.4 vendor/kuromoji-0.7.7/src/main/java/org/atilika/kuromoji/example/TokenizerExample.java
kuromoji-ruby-0.0.3 vendor/kuromoji-0.7.7/src/main/java/org/atilika/kuromoji/example/TokenizerExample.java
kuromoji-ruby-0.0.2 vendor/kuromoji-0.7.7/src/main/java/org/atilika/kuromoji/example/TokenizerExample.java
kuromoji-ruby-0.0.1 vendor/kuromoji-0.7.7/src/main/java/org/atilika/kuromoji/example/TokenizerExample.java
kuromoji-0.0.1 vendor/kuromoji-0.7.7/src/main/java/org/atilika/kuromoji/example/TokenizerExample.java