Module: TextUtils::ValueHelper

Included in:
ValuesReader
Defined in:
lib/textutils/helper/value_helper.rb

Instance Method Summary collapse

Instance Method Details

#find_grade(value) ⇒ Object

NB: returns an array [grade, value], i.e. two values



147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
# File 'lib/textutils/helper/value_helper.rb', line 147

# Extracts an optional star grade from a title-like value.
#
# Stars only count when they open or close the value and are set off by
# whitespace, e.g.
#   *** Anton Bauer   or
#   Anton Bauer ***
#
# Mapping: *** => 1, ** => 2, * => 3; without stars the grade stays at 4.
#
# Returns a two-element array [grade, value]; value has the matched stars
# (and the whitespace next to them) removed.
def find_grade( value )
  grade = 4   # default when no stars are present

  # Check the leading position first, then the trailing one; when both
  # carry stars, the trailing marker decides the grade.
  [ /^\s*(\*{1,3})\s+/, /\s+(\*{1,3})\s*$/ ].each do |stars_pattern|
    value = value.sub( stars_pattern ) do
      # the capture holds one to three stars: more stars => lower grade number
      grade = 4 - Regexp.last_match( 1 ).length
      ''   # strip the stars from the value
    end
  end

  [grade, value]
end

#find_key_n_title(values) ⇒ Object

NB: returns an array [attribs, more_values], i.e. two values



185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
# File 'lib/textutils/helper/value_helper.rb', line 185

# Splits a list of values into key/title attributes plus the remaining values.
#
# When the first value looks like a key, it is taken as the key and the second
# value as the title; otherwise the first value is the title and the key is
# generated from it via TextUtils.title_to_key.
#
# A key starts with a lowercase letter a-z, may contain a-z, 0-9 and dots
# (e.g. world.quali.america, at.cup, at.2, at.3.1) and must not end with a dot;
# a single letter is the shortest possible key.
#
# The title may carry a grade (***/**/*) and synonyms separated by |
# (e.g. FC Bayern Muenchen|Bayern Muenchen|Bayern).
#
# Returns a two-element array [attribs, more_values]. attribs always has
# :title and :key; :grade is set only when stars were found and :synonyms
# only when the title lists alternatives.
#
# todo/fix: do NOT allow mixing records with and without keys in one file
# todo/fix: support a leading underscore, or keys starting with digits?
# todo/fix: find parts? e.g. ‹Estrella› ‹Damm› Inedit
#   becomes =>  title: 'Estrella Damm Inedit'  and  parts: ['Estrella','Damm']
def find_key_n_title( values )
  ## fix: add/configure logger for ActiveRecord!!!
  logger = LogKernel::Logger.root

  # truthy when the first value qualifies as a key
  explicit_key = values[0] =~ /^([a-z][a-z0-9.]*[a-z0-9]|[a-z])$/

  if explicit_key
    key_col     = values[0]
    title_col   = values[1]
    more_values = values[2..-1]
  else
    key_col     = nil   # filled in below from the first title
    title_col   = values[0]
    more_values = values[1..-1]
  end

  # pull an optional grade off the title and continue with the stripped title
  grade, title_col = find_grade( title_col )

  attribs = {}

  # the default grade (no stars) is deliberately not recorded as an attribute
  if [1, 2, 3].include?( grade )
    logger.debug "   found grade #{grade} in title"
    attribs[:grade] = grade
  end

  # first entry is the title proper; everything after it is a synonym
  first_title, *synonyms = title_col.split( '|' )

  attribs[:title]    = first_title
  attribs[:synonyms] = synonyms.join( '|' )  unless synonyms.empty?

  unless explicit_key
    key_col = TextUtils.title_to_key( first_title )
    logger.debug "   autogen key »#{key_col}« from title »#{first_title}«"
  end

  attribs[:key] = key_col

  [attribs, more_values]
end

#is_address?(value) ⇒ Boolean

Returns:

  • (Boolean)


128
129
130
131
132
133
134
# File 'lib/textutils/helper/value_helper.rb', line 128

# Tells whether a value looks like an address: anything containing a double
# slash qualifies, e.g. 3970 Weitra // Sparkasseplatz 160
#
# Returns true or false (never the match offset or nil).
def is_address?( value )
  !( value =~ /\/{2}/ ).nil?
end

#is_taglist?(value) ⇒ Boolean

Returns:

  • (Boolean)


136
137
138
139
140
141
142
143
144
# File 'lib/textutils/helper/value_helper.rb', line 136

# Tells whether a value looks like a tag list.
#
# A tag list starts with a lowercase letter, may continue with lowercase
# letters, digits, |, _ and spaces, and ends with a lowercase letter or digit.
# Values starting with a number (e.g. 14 ha or 5_000 hl) are rejected for now.
#   -- in the future allow free standing years (e.g. 1980 etc.)?
#
# Returns true or false (never the match offset or nil).
def is_taglist?( value )
  !( value =~ /^([a-z][a-z0-9\|_ ]*[a-z0-9]|[a-z])$/ ).nil?
end

#is_website?(value) ⇒ Boolean

Returns:

  • (Boolean)


104
105
106
107
108
109
110
111
112
113
114
# File 'lib/textutils/helper/value_helper.rb', line 104

# Tells whether a value looks like a url/internet address,
# e.g. www.ottakringer.at
#
# The value qualifies when it
#  - starts with  www.  or
#  - ends with    .com
#
# fix: support more url formats (e.g. w/o www. - look for country codes etc.)
#
# Returns true or false (never the match offset or nil).
def is_website?( value )
  !( value =~ /^www\.|\.com$/ ).nil?
end

#is_year?(value) ⇒ Boolean

Returns:

  • (Boolean)


22
23
24
25
26
27
28
# File 'lib/textutils/helper/value_helper.rb', line 22

# Tells whether a value is a four-digit year (founded/established),
# e.g. 1776
#
# Returns true or false (never the match offset or nil).
def is_year?( value )
  !( value =~ /^[0-9]{4}$/ ).nil?
end

#match_abv(value) ⇒ Object

alcohol by volume (abv) e.g. 5.2%



64
65
66
67
68
69
70
71
72
# File 'lib/textutils/helper/value_helper.rb', line 64

# Matches an alcohol by volume (abv) value, e.g. 5.2%
#
# A leading < is tolerated (e.g. <0.5%), as is whitespace before the number
# and before the percent sign.
#
# Yields the number as a float and returns true on a match;
# returns false (without yielding) otherwise.
def match_abv( value )
  return false unless value =~ /^<?\s*(\d+(?:\.\d+)?)\s*%$/

  yield( Regexp.last_match( 1 ).to_f )  # convert to decimal? how? use float?
  true
end

#match_brewery(value) ⇒ Object

fix: move to beerdb ??? why? why not?? - yes, move to beerdb-models



10
11
12
13
14
15
16
17
18
19
# File 'lib/textutils/helper/value_helper.rb', line 10

# Matches a "brewed by" reference of the form by:<brewery key>.
#
# On a match the text after the by: prefix is looked up with
# BeerDb::Model::Brewery.find_by_key!, the result is yielded, and true is
# returned. Returns false (without any lookup or yield) when the value does
# not start with by:.
#
# fix: move to beerdb-models
def match_brewery( value )
  # NB: \A (start of string) instead of ^ (start of any line) - the prefix is
  #  cut off at a fixed offset below, so by: must sit at the very beginning
  return false unless value =~ /\Aby:/

  brewery_key = value[3..-1]  # cut off by: prefix
  brewery = BeerDb::Model::Brewery.find_by_key!( brewery_key )
  yield( brewery )
  true
end

#match_hl(value) ⇒ Object

hectoliters (hl); 1 hl = 100 l



94
95
96
97
98
99
100
101
# File 'lib/textutils/helper/value_helper.rb', line 94

# Matches a volume in hectoliters (hl); 1 hl = 100 l
#   e.g. 20_000 hl or 50hl etc.
#
# Digits may be grouped with underscores or spaces; whitespace before hl is
# optional.
#
# Yields the number as an integer and returns true on a match;
# returns false (without yielding) otherwise.
def match_hl( value )
  return false unless value =~ /^(?:([0-9][0-9_ ]+[0-9]|[0-9]{1,2})\s*hl)$/

  digits = Regexp.last_match( 1 ).delete( ' _' )  # drop the group separators
  yield( digits.to_i )
  true
end

#match_kcal(value) ⇒ Object



84
85
86
87
88
89
90
91
92
# File 'lib/textutils/helper/value_helper.rb', line 84

# Matches an energy value in kcal,
#   e.g. 44.4 kcal/100ml or 44.4 kcal or 44.4kcal
#
# Yields the number as a float and returns true on a match;
# returns false (without yielding) otherwise.
def match_kcal( value )
  return false unless value =~ /^(\d+(?:\.\d+)?)\s*kcal(?:\/100ml)?$/

  yield( Regexp.last_match( 1 ).to_f )  # convert to decimal? how? use float?
  true
end

#match_km_squared(value) ⇒ Object



41
42
43
44
45
46
47
48
49
50
# File 'lib/textutils/helper/value_helper.rb', line 41

# Matches an area in square kilometers, e.g. 453 km² or 45_000 km2
#
# Digits may be grouped with underscores or spaces; the unit may be written
# as km2 or km².
#
# Yields the number as an integer and returns true on a match;
# returns false (without yielding) otherwise.
def match_km_squared( value )
  return false unless value =~ /^([0-9][0-9 _]+[0-9]|[0-9]{1,2})(?:\s*(?:km2|km²)\s*)$/

  # strip the unit first, then the group separators, and convert what is left
  digits = value.gsub( 'km2', '' ).gsub( 'km²', '' ).delete( ' _' )
  yield( digits.to_i )
  true
end

#match_number(value) ⇒ Object



52
53
54
55
56
57
58
59
60
61
# File 'lib/textutils/helper/value_helper.rb', line 52

# Matches a plain non-negative integer.
#
# Digits may be grouped with underscores or spaces,
#   e.g. 1_000_000 or 1 000 000
#
# Yields the number as an integer and returns true on a match;
# returns false (without yielding) otherwise.
def match_number( value )
  # NB: the alternation must sit inside ONE group so that both anchors apply
  #  to both alternatives; otherwise anything merely starting with a number
  #  (123 apples) or ending in one or two digits (Route 66) would match
  return false unless value =~ /^([0-9][0-9 _]+[0-9]|[0-9]{1,2})$/

  digits = Regexp.last_match( 1 ).delete( ' _' )  # drop the group separators
  yield( digits.to_i )
  true
end

#match_og(value) ⇒ Object

plato (stammwuerze/gravity?) e.g. 11.2°



74
75
76
77
78
79
80
81
82
# File 'lib/textutils/helper/value_helper.rb', line 74

# Matches a plato value (stammwuerze/gravity?), e.g. 11.2°
#
# NB: no whitespace allowed between the number and the ° sign.
#
# Yields the number as a float and returns true on a match;
# returns false (without yielding) otherwise.
def match_og( value )
  return false unless value =~ /^(\d+(?:\.\d+)?)°$/

  yield( Regexp.last_match( 1 ).to_f )  # convert to decimal? how? use float?
  true
end

#match_website(value) ⇒ Object



116
117
118
119
120
121
122
123
124
# File 'lib/textutils/helper/value_helper.rb', line 116

# Matches a url/internet address, e.g. www.ottakringer.at
# The check itself is delegated to is_website?.
#
# fix: support more url formats (e.g. w/o www. - look for country codes etc.)
#
# Yields the unchanged value and returns true on a match;
# returns false (without yielding) otherwise.
def match_website( value )
  return false unless is_website?( value )

  yield( value )
  true
end

#match_year(value) ⇒ Object



31
32
33
34
35
36
37
38
# File 'lib/textutils/helper/value_helper.rb', line 31

# Matches a founded/established year, e.g. 1776
# The check itself is delegated to is_year?.
#
# Yields the year as an integer and returns true on a match;
# returns false (without yielding) otherwise.
def match_year( value )
  return false unless is_year?( value )

  yield( value.to_i )
  true
end