Module: PragmaticTokenizer::Languages

Defined in:
lib/pragmatic_tokenizer/languages.rb,
lib/pragmatic_tokenizer/languages/czech.rb,
lib/pragmatic_tokenizer/languages/dutch.rb,
lib/pragmatic_tokenizer/languages/greek.rb,
lib/pragmatic_tokenizer/languages/arabic.rb,
lib/pragmatic_tokenizer/languages/common.rb,
lib/pragmatic_tokenizer/languages/danish.rb,
lib/pragmatic_tokenizer/languages/french.rb,
lib/pragmatic_tokenizer/languages/polish.rb,
lib/pragmatic_tokenizer/languages/slovak.rb,
lib/pragmatic_tokenizer/languages/catalan.rb,
lib/pragmatic_tokenizer/languages/deutsch.rb,
lib/pragmatic_tokenizer/languages/english.rb,
lib/pragmatic_tokenizer/languages/finnish.rb,
lib/pragmatic_tokenizer/languages/italian.rb,
lib/pragmatic_tokenizer/languages/latvian.rb,
lib/pragmatic_tokenizer/languages/persian.rb,
lib/pragmatic_tokenizer/languages/russian.rb,
lib/pragmatic_tokenizer/languages/spanish.rb,
lib/pragmatic_tokenizer/languages/swedish.rb,
lib/pragmatic_tokenizer/languages/turkish.rb,
lib/pragmatic_tokenizer/languages/romanian.rb,
lib/pragmatic_tokenizer/languages/bulgarian.rb,
lib/pragmatic_tokenizer/languages/norwegian.rb,
lib/pragmatic_tokenizer/languages/indonesian.rb,
lib/pragmatic_tokenizer/languages/portuguese.rb

Defined Under Namespace

Modules: Arabic, Bulgarian, Catalan, Common, Czech, Danish, Deutsch, Dutch, English, Finnish, French, Greek, Indonesian, Italian, Latvian, Norwegian, Persian, Polish, Portuguese, Romanian, Russian, Slovak, Spanish, Swedish, Turkish

Constant Summary collapse

LANGUAGE_CODES =
{
    :en => English,
    :ar => Arabic,
    :bg => Bulgarian,
    :ca => Catalan,
    :cs => Czech,
    :da => Danish,
    :de => Deutsch,
    :el => Greek,
    :es => Spanish,
    :fa => Persian,
    :fi => Finnish,
    :fr => French,
    :id => Indonesian,
    :it => Italian,
    :lv => Latvian,
    :nl => Dutch,
    :nn => Norwegian,
    :nb => Norwegian,
    :no => Norwegian,
    :pl => Polish,
    :pt => Portuguese,
    :ro => Romanian,
    :ru => Russian,
    :sk => Slovak,
    :sv => Swedish,
    :tr => Turkish
}.freeze

Class Method Summary collapse

Class Method Details

.get_language_by_code(code) ⇒ Object



59
60
61
62
# File 'lib/pragmatic_tokenizer/languages.rb', line 59

def self.get_language_by_code(code)
  code = code ? code.to_sym : :en
  LANGUAGE_CODES[code] || Common
end