Module: Iev::Utilities

Included in:
SourceParser, TermBuilder
Defined in:
lib/iev/utilities.rb

Constant Summary collapse

# Regexp source (a String, compiled later with Regexp.new) matching a
# `<simg ...>` tag whose content contains `/$file/`. Capture 1 is the
# file name that follows `/$file/` (digits, hyphens, word characters, dots).
SIMG_PATH_REGEX =
"<simg .*\\/\\$file\\/([\\d\\-\\w\.]+)>"
# Regexp source matching one figure caption of the form
# `<p><b>Figure N – caption</b>` with an optional closing `</p>`.
# Captures: (1) the figure number, a single digit; (2) the caption text;
# (3) the optional `</p>`. The separator may be an en dash or a hyphen.
FIGURE_ONE_REGEX =
'<p><b>\\s*Figure\\s+(\\d)\\s+[–-]\\s+(.+)\\s*<\\/b>(<\\/p>)?'
# Regexp source matching two consecutive figure captions separated by
# optional whitespace. Because FIGURE_ONE_REGEX is embedded twice, the
# second caption's captures are numbered after the first caption's three.
FIGURE_TWO_REGEX =
"#{FIGURE_ONE_REGEX}\\s*#{FIGURE_ONE_REGEX}".freeze
# Leading part of every image reference emitted by parse_anchor_tag; the
# term domain and the file name are appended to it.
IMAGE_PATH_PREFIX =
"image::/assets/images/parts"

Instance Method Summary collapse

Instance Method Details

#parse_anchor_tag(text, term_domain) ⇒ Object



11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
# File 'lib/iev/utilities.rb', line 11

# Rewrites the HTML-like markup found in IEV text into inline text markup.
#
# The substitutions run in this order, each on the result of the previous:
# 1. `<a href="IEV nnn-nn-nn">text</a>`  -> `{{text, IEV:nnn-nn-nn}}`
# 2. `<a href="nnn-nn-nn">text</a>`      -> `{{text, IEV:nnn-nn-nn}}`
# 3. unterminated IEV anchors (to end of line) -> `{{text, IEV:nnn-nn-nn}}`
# 4. any other `<a href="target">text</a>` -> `target[text]`
# 5. `<simg>` followed by two figure captions -> image reference with both
#    captions
# 6. `<simg>` followed by one figure caption  -> image reference
# 7. `<img ...>`  -> image reference with empty brackets
# 8. `<br>`       -> newline
# 9. `<b>text</b>` -> `*text*`
#
# @param text [String, nil] markup to convert
# @param term_domain [#to_s] interpolated into the image path after
#   IMAGE_PATH_PREFIX
# @return [String, nil] the converted text, or nil when +text+ is nil/false
def parse_anchor_tag(text, term_domain)
  return unless text

  image_base = "#{IMAGE_PATH_PREFIX}/#{term_domain}"

  text.gsub(
    # IEV term references with an explicit "IEV" prefix. The closing tag is
    # matched as `</?a>` to cope with malformed input such as
    #  `inverse de la <a href="IEV103-06-01">période<a>`
    %r{<a href="?(IEV)\s*(\d\d\d-\d\d-\d\d\d?)"?>(.*?)</?a>},
    '{{\3, \1:\2}}',
  ).gsub(
    # IEV term references without the "IEV" prefix. This pattern has only
    # two groups: \1 is the concept number and \2 is the link text.
    %r{<a href="?\s*(\d\d\d-\d\d-\d\d\d?)"?>(.*?)</?a>},
    '{{\2, IEV:\1}}',
  ).gsub(
    # To handle <a> tags without ending tag like
    #  `Voir <a href=IEV103-05-21>IEV 103-05-21`
    #  for concept '702-03-11' in `fr`
    /<a href="?(IEV)?\s*(\d\d\d-\d\d-\d\d\d?)"?>(.*?)$/,
    '{{\3, IEV:\2}}',
  ).gsub(
    # Remaining (non-IEV) href links
    %r{<a href="?([^<>]*?)"?>(.*?)</a>},
    '\1[\2]',
  ).gsub(
    # Image followed by two captions: \2/\3 are the first caption's number
    # and title, \6 is the second caption's title.
    Regexp.new([SIMG_PATH_REGEX, '\\s*', FIGURE_TWO_REGEX].join),
    "#{image_base}/\\1[Figure \\2 - \\3; \\6]",
  ).gsub(
    Regexp.new([SIMG_PATH_REGEX, '\\s*', FIGURE_ONE_REGEX].join),
    "#{image_base}/\\1[Figure \\2 - \\3]",
  ).gsub(
    /<img\s+([^<>]+?)\s*>/,
    "#{image_base}/\\1[]",
  ).gsub(
    /<br>/,
    "\n",
  ).gsub(
    %r{<b>(.*?)</b>},
    '*\\1*',
  )
end

#replace_newlines(input) ⇒ Object



51
52
53
54
55
56
# File 'lib/iev/utilities.rb', line 51

# Turns line-break markers in +input+ into blank-line paragraph breaks.
#
# @param input [String] text to normalise
# @return [String] text with breaks collapsed to "\n\n" and outer
#   whitespace stripped
def replace_newlines(input)
  paragraph_break = "\n\n"

  # Single-quoted: this targets the two-character sequence backslash + "n",
  # not an actual newline character.
  without_escapes = input.gsub('\n', paragraph_break)

  # Any tag made up solely of the letters p, b and r becomes a break.
  without_tags = without_escapes.gsub(/<[pbr]+>/, paragraph_break)

  # A newline followed by further whitespace, plus any whitespace before it,
  # collapses into exactly one break.
  collapsed = without_tags.gsub(/\s*\n[\n\s]+/, paragraph_break)

  collapsed.strip
end