Module: PragmaticTokenizer

Defined in:
lib/pragmatic_tokenizer/version.rb,
lib/pragmatic_tokenizer/languages.rb,
lib/pragmatic_tokenizer/tokenizer.rb,
lib/pragmatic_tokenizer/pre_processor.rb,
lib/pragmatic_tokenizer/post_processor.rb,
lib/pragmatic_tokenizer/languages/czech.rb,
lib/pragmatic_tokenizer/languages/dutch.rb,
lib/pragmatic_tokenizer/languages/greek.rb,
lib/pragmatic_tokenizer/languages/arabic.rb,
lib/pragmatic_tokenizer/languages/common.rb,
lib/pragmatic_tokenizer/languages/danish.rb,
lib/pragmatic_tokenizer/languages/french.rb,
lib/pragmatic_tokenizer/languages/polish.rb,
lib/pragmatic_tokenizer/languages/slovak.rb,
lib/pragmatic_tokenizer/languages/catalan.rb,
lib/pragmatic_tokenizer/languages/deutsch.rb,
lib/pragmatic_tokenizer/languages/english.rb,
lib/pragmatic_tokenizer/languages/finnish.rb,
lib/pragmatic_tokenizer/languages/italian.rb,
lib/pragmatic_tokenizer/languages/latvian.rb,
lib/pragmatic_tokenizer/languages/persian.rb,
lib/pragmatic_tokenizer/languages/russian.rb,
lib/pragmatic_tokenizer/languages/spanish.rb,
lib/pragmatic_tokenizer/languages/swedish.rb,
lib/pragmatic_tokenizer/languages/turkish.rb,
lib/pragmatic_tokenizer/languages/romanian.rb,
lib/pragmatic_tokenizer/full_stop_separator.rb,
lib/pragmatic_tokenizer/languages/bulgarian.rb,
lib/pragmatic_tokenizer/languages/norwegian.rb,
lib/pragmatic_tokenizer/languages/indonesian.rb,
lib/pragmatic_tokenizer/languages/portuguese.rb,
lib/pragmatic_tokenizer/ending_punctuation_separator.rb

Defined Under Namespace

Modules: Languages

Classes: EndingPunctuationSeparator, FullStopSeparator, PostProcessor, PreProcessor, Tokenizer

Constant Summary

VERSION = "1.0.0"