Module: Kuromoji

Defined in:
lib/kuromoji.rb,
lib/kuromoji/version.rb

Constant Summary collapse

# Object produced by importing the Java class org.atilika.kuromoji.Tokenizer
# through Rjb and calling builder.build on it (presumably a ready-to-use
# tokenizer instance; confirm against the Kuromoji Java API).
Tokenizer =
Rjb::import('org.atilika.kuromoji.Tokenizer').builder.build
# Version string for the Kuromoji module.
VERSION =
"0.0.1"

Class Method Summary collapse

Class Method Details

.process(method, sentence) ⇒ Object



17
18
19
20
21
22
23
24
25
26
# File 'lib/kuromoji.rb', line 17

# Tokenizes +sentence+ with Tokenizer and builds a hash keyed by each
# token's surface form, whose value is the result of sending +method+
# to that token.
#
# Tokens sharing the same surface form share one hash key, so the value
# from the later token replaces the earlier one.
#
# @param method [Symbol, String] name of the token method to invoke
# @param sentence [String] text handed to Tokenizer.tokenize
# @return [Hash] surface form => result of calling +method+ on the token
def self.process(method, sentence)
  cursor = Tokenizer.tokenize(sentence).iterator
  by_surface = {}
  # The token list is walked through its has_next/next iterator protocol.
  while cursor.has_next
    token = cursor.next
    by_surface.store(token.surface_form, token.send(method))
  end
  by_surface
end

.reading(sentence) ⇒ Object



13
14
15
# File 'lib/kuromoji.rb', line 13

# Delegates to +process+, asking each token for +getReading+.
#
# @param sentence [String] text to tokenize
# @return [Object] whatever +process+ returns for the +:getReading+ accessor
def self.reading(sentence)
  accessor = :getReading
  process(accessor, sentence)
end

.tokenize(sentence) ⇒ Object



9
10
11
# File 'lib/kuromoji.rb', line 9

# Delegates to +process+, asking each token for +all_features+.
#
# @param sentence [String] text to tokenize
# @return [Object] whatever +process+ returns for the +:all_features+ accessor
def self.tokenize(sentence)
  accessor = :all_features
  process(accessor, sentence)
end