Class: TwitterCldr::Resources::UnicodeDataImporter

Inherits:
UnicodeImporter show all
Defined in:
lib/twitter_cldr/resources/unicode_data_importer.rb

Constant Summary collapse

BLOCKS_URL =
'ftp://ftp.unicode.org/Public/UNIDATA/Blocks.txt'
UNICODE_DATA_URL =
'ftp://ftp.unicode.org/Public/UNIDATA/UnicodeData.txt'
CASEFOLDING_DATA_URL =
'ftp://ftp.unicode.org/Public/UNIDATA/CaseFolding.txt'

Instance Method Summary collapse

Constructor Details

#initialize(input_path, output_path) ⇒ UnicodeDataImporter

Arguments:

input_path  - path to a directory containing Blocks.txt and UnicodeData.txt
output_path - output directory for imported YAML files


22
23
24
25
# File 'lib/twitter_cldr/resources/unicode_data_importer.rb', line 22

def initialize(input_path, output_path)
  @input_path  = input_path
  @output_path = output_path
end

Instance Method Details

#importObject



27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# File 'lib/twitter_cldr/resources/unicode_data_importer.rb', line 27

def import
  blocks           = import_blocks
  unicode_data     = import_unicode_data(blocks)
  casefolding_data = import_casefolding_data
  index_data       = build_indices(
    TwitterCldr::Shared::CodePoint::INDICES, unicode_data
  )

  File.open(File.join(@output_path, 'blocks.yml'), 'w') do |output|
    YAML.dump(blocks, output)
  end

  FileUtils.mkdir_p(File.join(@output_path, 'blocks'))

  unicode_data.each do |block_name, code_points|
    File.open(File.join(@output_path, 'blocks', "#{block_name}.yml"), 'w') do |output|
      YAML.dump(code_points, output)
    end
  end

  File.open(File.join(@output_path, 'casefolding.yml'), 'w') do |output|
    YAML.dump(casefolding_data, output)
  end

  FileUtils.mkdir_p(File.join(@output_path, 'indices'))

  indices = index_data

  indices.each_pair do |index_name, data|
    File.open(File.join(@output_path, "indices", "#{index_name}.yml"), 'w') do |output|
      YAML.dump(data, output)
    end
  end

  File.open(File.join(@output_path, "indices", "keys.yml"), 'w') do |output|
    YAML.dump(
      indices.inject({}) do |ret, (index_name, data)|
        data.keys.each do |prop|
          ret[prop] ||= []
          ret[prop] << index_name
        end
        ret
      end, output
    )
  end
end