Class: PubliSci::Reader::CSV
Instance Method Summary
collapse
#interact
#abbreviate_known, #code_lists, #component_gen, #component_specifications, #concept_codes, #data_structure_definition, #dataset, #defaults, #dimension_properties, #encode_data, #generate, #generate_resources, #measure_properties, #observations, #prefixes, #vocabulary
Methods included from Parser
#get_ary, #get_hashes, #is_uri?, #load_string, #observation_hash, #sanitize, #sanitize_hash, #strip_prefixes, #strip_uri, #to_literal, #to_resource
Instance Method Details
#automatic(file = nil, dataset_name = nil, options = {}, interactive = true) ⇒ Object
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
|
# File 'lib/bio-publisci/readers/csv.rb', line 7
# Guided entry point: fills in whatever arguments are missing and then
# delegates to #generate_n3.
#
# When +interactive+ is true, missing values are requested on the console
# (the file name via gets, everything else via #interact). When it is false,
# nothing is prompted for and missing options are left untouched.
#
# @param file [String, nil] path of the CSV file; asked for when nil and interactive
# @param dataset_name [String, nil] dataset name; defaults to the file's
#   basename up to its first "."
# @param options [Hash] generation options; :dimensions and :measures may be
#   added in place from the prompts before the hash is passed to #generate_n3
# @param interactive [Boolean] whether to prompt for missing values
# @return [Object] the result of #generate_n3
# @raise [RuntimeError] if no (non-empty) input file name is available
def automatic(file=nil,dataset_name=nil,options={},interactive=true)
  if interactive && !file
    puts "Input file?"
    # gets returns nil at end of input; to_s lets that case reach the
    # descriptive error below instead of failing with NoMethodError.
    file = gets.to_s.chomp
  end
  raise "CSV reader needs an input file" unless file && file.size > 0

  unless dataset_name
    default_name = File.basename(file).split('.').first
    dataset_name =
      if interactive
        interact("Dataset name?", "#{default_name}") { |sel| default_name }
      else
        default_name
      end
  end

  # Only the header row is needed here. #generate_n3 parses the complete
  # file itself, so reading a single row avoids parsing every row twice.
  categories = ::CSV.open(file) { |csv| csv.shift }

  if interactive && !options[:dimensions]
    options[:dimensions] = Array(interact("Dimensions?", categories[0], categories))
  end

  if interactive && !options[:measures]
    # Candidate measures are all header columns not already used as dimensions.
    meas = categories - (options[:dimensions] || [categories[0]])
    selection = interact("Measures?", meas, meas) { |s| nil }
    # A nil selection leaves :measures unset so the reader's own default applies.
    options[:measures] = Array(selection) unless selection.nil?
  end

  generate_n3(file, dataset_name, options)
end
|
#codes ⇒ Object
54
55
56
|
# File 'lib/bio-publisci/readers/csv.rb', line 54
# Columns to treat as coded values.
#
# @return [Object] the :codes entry of @options when it is set, otherwise
#   whatever #dimensions returns
def codes
  explicit = @options[:codes]
  return explicit if explicit

  dimensions
end
|
#dimensions ⇒ Object
50
51
52
|
# File 'lib/bio-publisci/readers/csv.rb', line 50
# Columns to use as dimensions.
#
# @return [Object] the :dimensions entry of @options when it is set,
#   otherwise a one-element array holding the first cell of the first row
#   of @data
def dimensions
  chosen = @options[:dimensions]
  if chosen
    chosen
  else
    first_row = @data[0]
    [first_row[0]]
  end
end
|
#generate_n3(file, dataset_name, options = {}) ⇒ Object
44
45
46
47
48
|
# File 'lib/bio-publisci/readers/csv.rb', line 44
# Reads the CSV file into @data, remembers the options in @options, and
# passes the derived measures, dimensions, codes, column data and row
# labels to #generate.
#
# @param file [String] path of the CSV file to read
# @param dataset_name [String] name forwarded to #generate
# @param options [Hash] options stored in @options and forwarded to #generate
# @return [Object] the result of #generate
def generate_n3(file, dataset_name, options={})
  @data = ::CSV.read(file)
  @options = options

  # The helpers below all read @data / @options, so both must be set first.
  measure_names   = measures
  dimension_names = dimensions
  code_names      = codes
  columns         = observation_data
  row_labels      = observation_labels

  generate(measure_names, dimension_names, code_names, columns, row_labels, dataset_name, options)
end
|
#measures ⇒ Object
58
59
60
|
# File 'lib/bio-publisci/readers/csv.rb', line 58
# Columns to use as measures.
#
# @return [Object] the :measures entry of @options when it is set,
#   otherwise the first row of @data with the #dimensions entries removed
def measures
  explicit = @options[:measures]
  return explicit if explicit

  @data[0] - dimensions
end
|
#observation_data ⇒ Object
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
|
# File 'lib/bio-publisci/readers/csv.rb', line 74
# Pivots the rows of @data into columns keyed by the header row.
#
# The first row of @data supplies the labels; each later row's entries are
# appended, position by position, to the array stored under the label at
# the same index. @data itself is not modified.
#
# @return [Hash] header label => array of that column's entries, in row order
def observation_data
  header, *rows = @data

  columns = header.each_with_object({}) { |label, acc| acc[label] = [] }

  rows.each do |row|
    row.each_with_index do |entry, index|
      columns[header[index]] << entry
    end
  end

  columns
end
|
#observation_labels ⇒ Object
62
63
64
65
66
67
68
69
70
71
72
|
# File 'lib/bio-publisci/readers/csv.rb', line 62
# Labels for the data rows (every row of @data after the first).
#
# @return [Array] when @options[:label_column] is set, the entry at that
#   index from each data row; otherwise the integers 1 through the number
#   of data rows
def observation_labels
  column = @options[:label_column]
  return (1...@data.size).to_a unless column

  @data.drop(1).map { |row| row[column] }
end
|