Module: Kuromoji
- Defined in:
- lib/kuromoji.rb,
lib/kuromoji/version.rb
Constant Summary collapse
- Tokenizer =
Rjb::import('org.atilika.kuromoji.Tokenizer').builder.build
- VERSION =
"0.0.1"
Class Method Summary collapse
Class Method Details
.process(method, sentence) ⇒ Object
17 18 19 20 21 22 23 24 25 26 |
# File 'lib/kuromoji.rb', line 17
#
# Runs +sentence+ through +Tokenizer.tokenize+, walks the resulting list with
# its iterator, and collects one hash entry per token.
#
# @param method [Symbol, String] name of the method invoked on every token
#   through +send+ (callers in this module pass +:getReading+ and
#   +:all_features+)
# @param sentence [Object] value handed unchanged to +Tokenizer.tokenize+;
#   presumably a String of Japanese text -- confirm against callers
# @return [Hash] maps each token's +surface_form+ to the result of calling
#   +method+ on that token. Entries are keyed by surface form, so when the same
#   surface form occurs more than once the later token's value replaces the
#   earlier one.
def self.process(method, sentence)
  cursor = Tokenizer.tokenize(sentence).iterator
  results = {}

  # The iterator exposes has_next/next rather than each, so advance it by hand.
  while cursor.has_next
    token = cursor.next
    surface = token.surface_form
    results[surface] = token.send(method)
  end

  results
end
.reading(sentence) ⇒ Object
13 14 15 |
# File 'lib/kuromoji.rb', line 13
#
# Delegates to +process+, asking it to call +getReading+ on every token.
#
# @param sentence [Object] value forwarded unchanged to +process+; presumably
#   a String of Japanese text -- confirm against callers
# @return [Object] whatever +process+ returns for +:getReading+
def self.reading(sentence)
  process(:getReading, sentence)
end
.tokenize(sentence) ⇒ Object
9 10 11 |
# File 'lib/kuromoji.rb', line 9
#
# Delegates to +process+, asking it to call +all_features+ on every token.
#
# @param sentence [Object] value forwarded unchanged to +process+; presumably
#   a String of Japanese text -- confirm against callers
# @return [Object] whatever +process+ returns for +:all_features+
def self.tokenize(sentence)
  process(:all_features, sentence)
end