Module: Mitie

Defined in:
lib/mitie.rb,
lib/mitie/ffi.rb,
lib/mitie/ner.rb,
lib/mitie/utils.rb,
lib/mitie/version.rb,
lib/mitie/document.rb,
lib/mitie/ner_trainer.rb,
lib/mitie/text_categorizer.rb,
lib/mitie/ner_training_instance.rb,
lib/mitie/binary_relation_trainer.rb,
lib/mitie/binary_relation_detector.rb,
lib/mitie/text_categorizer_trainer.rb

Defined Under Namespace

Modules: FFI, Utils

Classes: BinaryRelationDetector, BinaryRelationTrainer, Document, Error, NER, NERTrainer, NERTrainingInstance, TextCategorizer, TextCategorizerTrainer

Constant Summary collapse

VERSION =
"0.3.3"

Class Attribute Summary collapse

Class Method Summary collapse

Class Attribute Details

.ffi_lib ⇒ Object

Returns the value of attribute ffi_lib.



20
21
22
# File 'lib/mitie.rb', line 20

# Reader for the +ffi_lib+ attribute.
#
# @return [Object, nil] the value currently stored in @ffi_lib, or nil when
#   nothing has been assigned yet
def ffi_lib
  instance_variable_get(:@ffi_lib)
end

Class Method Details

.tokenize(text) ⇒ Object



45
46
47
48
49
50
51
# File 'lib/mitie.rb', line 45

# Splits +text+ into tokens using the native MITIE tokenizer.
#
# The argument is converted with +to_s+ exactly once, and that converted
# string is used both for the native call and for deciding the encoding of
# the returned tokens. Non-String arguments (Integer, nil, ...) therefore
# work instead of failing on a missing +#encoding+ method after the native
# call has already run.
#
# @param text [#to_s] the text to tokenize
# @return [Array<String>] the tokens, tagged with the encoding of the
#   (converted) input string
def tokenize(text)
  # Unary + yields an unfrozen string, so frozen literals are never handed
  # to the native call directly.
  input = +text.to_s

  tokens_ptr = FFI.mitie_tokenize(input)
  # Register mitie_free as the pointer's release function.
  tokens_ptr.free = FFI["mitie_free"]

  # Tag each token with the input's encoding; force_encoding only relabels
  # the bytes, it does not transcode them.
  read_tokens(tokens_ptr).each { |token| token.force_encoding(input.encoding) }
end

.tokenize_file(filename) ⇒ Object

Raises:

  • (ArgumentError)


53
54
55
56
57
58
# File 'lib/mitie.rb', line 53

# Tokenizes the contents of the file at +filename+ using the native MITIE
# tokenizer.
#
# Accepts a String path as well as path-like objects (e.g. Pathname): the
# existence check already understands those, so the path is normalized to a
# String with File.path before being handed to the native call.
#
# NOTE(review): unlike +tokenize+, the returned tokens are not re-tagged with
# an encoding here; they keep whatever encoding +read_tokens+ produces.
#
# @param filename [String, #to_path] path of the file to tokenize
# @return [Array<String>] the tokens produced by +read_tokens+
# @raise [ArgumentError] if no file exists at +filename+
def tokenize_file(filename)
  raise ArgumentError, "File does not exist" unless File.exist?(filename)

  # File.path converts path-like objects to a String; unary + then yields an
  # unfrozen copy for the native call.
  path = +File.path(filename)

  tokens_ptr = FFI.mitie_tokenize_file(path)
  # Register mitie_free as the pointer's release function.
  tokens_ptr.free = FFI["mitie_free"]
  read_tokens(tokens_ptr)
end