Class: String

Inherits:

Object

Object
String

show all

Defined in: lib/ndr_support/string/cleaning.rb,
lib/ndr_support/string/conversions.rb

Constant Summary collapse

INVALID_CONTROL_CHARS =

/[\x00-\x08\x0b-\x0c\x0e-\x1f]/

ROMAN_ONE_TO_FIVE_MAPPING =

{ 'I' => '1', 'II' => '2', 'III' => '3', 'IIII' => '4', 'IV' => '4', 'V' => '5' }

POSTCODE_REGEXP =

/
  ^(
    [A-Z][0-9]           |
    [A-Z][0-9][0-9]      |
    [A-Z][0-9][A-Z]      |
    [A-Z][A-Z][0-9]      |
    NPT                  |
    [A-Z][A-Z][0-9][0-9] |
    [A-Z][A-Z][0-9][A-Z]
  )
  [0-9][A-Z][A-Z]
$/x

SOUNDEX_CHARS =

'BPFVCSKGJQXZDTLMNR'

SOUNDEX_NUMS =

'111122222222334556'

SOUNDEX_CHARS_EX =

'^' + SOUNDEX_CHARS

SOUNDEX_CHARS_DEL =

'^A-Z'

Instance Method Summary collapse

#clean(what) ⇒ Object
#date1 ⇒ Object
#date2 ⇒ Object
#nhs_numberize ⇒ Object

Show NHS numbers with spaces.
#orig_to_datetime ⇒ Object
#postcodeize(option = :user) ⇒ Object

Show postcode in various formats.
#soundex(census = true) ⇒ Object

desc: en.wikipedia.org/wiki/Soundex.
#sounds_like(other) ⇒ Object
#squash ⇒ Object

Used for comparing addresses.
#strip_xml_unsafe_characters ⇒ Object
#surname_and_initials ⇒ Object

Convert “SMITH JD” into “Smith JD”.
#surnameize ⇒ Object

Like titleize but copes with Scottish and Irish names.
#thedate ⇒ Object
#thetime ⇒ Object
#to_boolean ⇒ Object

Try to convert the string value into boolean.
#to_datetime ⇒ Object
#truncate_hellip(n) ⇒ Object

Truncate a string, with an HTML ellipsis entity (&hellip;) at the end.
#xml_unsafe? ⇒ Boolean

Instance Method Details

#clean(what) ⇒ `Object`

# File 'lib/ndr_support/string/cleaning.rb', line 46

# Normalise the string according to the kind of value it represents.
#
# Supported values of +what+ (anything else falls through to the final
# +else+ branch):
#
# * +:nhsnumber+                  - digits only, truncated to the first ten
# * +:postcode+, +:get_postcode+  - delegates to +postcodeize(:db)+
# * +:lpi+                        - upper-cased, keeping only 0-9 and A-Z
# * +:gender+                     - '1' for M/Male, '2' for F/Female, else the receiver
# * +:sex+                        - '1', '2' or '0' (unknown)
# * +:sex_c+                      - 'M', 'F' or '' (unknown)
# * +:name+                       - upper-cased with punctuation/whitespace tidied
# * +:ethniccategory+             - maps legacy codes, otherwise upper-cases
# * +:code+                       - separated codes with dots removed, space-joined
# * +:code_icd+                   - deprecated; see +:icd+
# * +:icd+                        - upper-cased, space-joined ICD codes
# * +:code_opcs+                  - delegates to +clean_code_opcs+
# * +:hospitalnumber+             - drops a trailing non-digit character
# * +:xmlsafe+, +:make_xml_safe+  - delegates to +strip_xml_unsafe_characters+
# * +:roman5+                     - converts roman numerals I..V to digits
# * +:tnmcategory+                - strips a leading T/N/M; 'X' upper-cased, the rest lower-cased
# * +:strip+, +:upcase+, +:itself+ - calls the method of the same name
#
# The receiver is never modified.
#
# @param what [Symbol] the cleaning rule to apply
# @return [String] the cleaned value
def clean(what)
  case what
  when :nhsnumber
    delete('^0-9')[0..9]
  when :postcode, :get_postcode
    postcodeize(:db)
  when :lpi
    upcase.delete('^0-9A-Z')
  when :gender
    if self =~ /\AM(ale)?/i
      '1'
    elsif self =~ /\AF(emale)?/i
      '2'
    else
      self
    end
  when :sex
    # SECURE: BNS 2012-10-09: But may behave oddly for multi-line input
    if self =~ /^M|1/i
      '1'
    elsif self =~ /^F|2/i
      '2'
    else
      '0'
    end
  when :sex_c
    if self =~ /^M|1/i
      'M'
    elsif self =~ /^F|2/i
      'F'
    else
      ''
    end
  when :name
    # Applied in insertion order: drop dots, turn , and ; into spaces,
    # collapse runs of whitespace, then replace backticks with apostrophes.
    substitutions = {
      '.'      => '',
      /,|;/    => ' ',
      /\s{2,}/ => ' ',
      '`'      => '\''
    }
    substitutions.inject(upcase) { |a, e| a.gsub(*e) }.strip
  when :ethniccategory
    replace_ethniccategory = {
      '0' => '0',
      '1' => 'M',
      '2' => 'N',
      '3' => 'H',
      '4' => 'J',
      '5' => 'K',
      '6' => 'R',
      '7' => '8',
      '&' => 'X',
      ' ' => 'X',
      '99' => 'X'
    }
    replace_ethniccategory[self] || upcase
  when :code
    split_on_separators.map do |code|
      code.blank? ? next : code.delete('.')
    end.compact.join(' ')
  when :code_icd
    warn '[DEPRECATION] clean(:code_icd) is deprecated - consider using clean(:icd) instead.'
    # regexp = /[A-Z][0-9]{2}(\.(X|[0-9]{1,2})|[0-9]?)( *(D|A)( |,|;|$))/
    codes = upcase.split_on_separators.delete_if { |x| x.squash.blank? }
    cleaned_codes = []
    codes.each do |code|
      # A lone 'D' or 'A' is a suffix belonging to the preceding code. When
      # there is no preceding code (it is the first token) keep it as-is
      # rather than failing on nil.
      if (code == 'D' || code == 'A') && !cleaned_codes.empty?
        cleaned_codes[-1] += code
      else
        cleaned_codes << code
      end
    end
    cleaned_codes.join(' ')
  when :icd
    codes = upcase.squish.split_on_separators.reject(&:blank?)
    codes.map { |code| code.gsub(/(?<=\d)(\.?X?)/, '') }.join(' ')
  when :code_opcs
    clean_code_opcs
  when :hospitalnumber
    # Keep the value when it ends in a digit, otherwise drop the last character.
    self[-1..-1] =~ /\d/ ? self : self[0..-2]
  when :xmlsafe, :make_xml_safe
    strip_xml_unsafe_characters
  when :roman5
    # This deromanises roman numerals between 1 and 5
    gsub(/[IV]+/i) { |match| ROMAN_ONE_TO_FIVE_MAPPING[match.upcase] }
  when :tnmcategory
    # Use the non-destructive +sub+: cleaning must not alter the receiver,
    # and +sub!+ would raise on frozen strings.
    category = sub(/\A[tnm]/i, '')
    if category =~ /\Ax\z/i
      category.upcase
    else
      category.downcase
    end
  when :strip, :upcase, :itself
    # SECURE: 14-06-2017 TPG Fixed list of executable methods (whats)
    send(what)
  else
    # The pattern is a plain String, so this replaces the literal
    # two-character sequence " ?" with a single space.
    gsub(' ?', ' ')
  end
end

#date1 ⇒ `Object`



40
41
42

# File 'lib/ndr_support/string/conversions.rb', line 40

# Builds a Daterange from this string and returns that object's +date1+.
# NOTE(review): presumably the first (start) date of the parsed range -
# confirm against Daterange, which is defined outside this file.
def date1
  Daterange.new(self).date1
end

#date2 ⇒ `Object`



44
45
46

# File 'lib/ndr_support/string/conversions.rb', line 44

# Builds a Daterange from this string and returns that object's +date2+.
# NOTE(review): presumably the second (end) date of the parsed range -
# confirm against Daterange, which is defined outside this file.
def date2
  Daterange.new(self).date2
end

#nhs_numberize ⇒ `Object`

Show NHS numbers with spaces

# File 'lib/ndr_support/string/conversions.rb', line 74

# Show NHS numbers with spaces: a ten-character string is split into
# groups of 3, 3 and 4 characters joined by single spaces.
# A string of any other length is returned as-is (the same object).
#
# @return [String]
def nhs_numberize
  if length == 10
    [self[0, 3], self[3, 3], self[6, 4]].join(' ')
  else
    self
  end
end

#orig_to_datetime ⇒ `Object`

128

# File 'lib/ndr_support/string/conversions.rb', line 128

alias orig_to_datetime to_datetime

#postcodeize(option = :user) ⇒ `Object`

Show postcode in various formats. Parameter “option” can be :user, :compact, :db

# File 'lib/ndr_support/string/cleaning.rb', line 27

# Show postcode in various formats.
#
# All whitespace is removed and the value upper-cased before it is checked
# against POSTCODE_REGEXP. A non-blank value that does not match is returned
# unchanged (the receiver itself).
#
# @param option [Symbol] one of:
#   * +:compact+ - no spaces at all
#   * +:db+      - padded with spaces before the last three characters so that
#                  5- and 6-character postcodes become 7 characters long
#   * anything else (including +:user+) - a single space before the last three
#     characters
# @return [String]
def postcodeize(option = :user)
  compacted = gsub(/[[:space:]]/, '').upcase

  # Don't change old-style or malformed postcodes
  return self if !compacted.blank? && POSTCODE_REGEXP !~ compacted
  return compacted if option == :compact

  if option == :db
    padding = { 5 => '  ', 6 => ' ' }[compacted.length]
    padding ? compacted.insert(-4, padding) : compacted
  elsif compacted.length < 5
    # Only reachable for blank input; nothing to split.
    compacted
  else
    # friendly format
    compacted.insert(-4, ' ')
  end
end

#soundex(census = true) ⇒ `Object`

desc: en.wikipedia.org/wiki/Soundex

# File 'lib/ndr_support/string/conversions.rb', line 26

# desc: en.wikipedia.org/wiki/Soundex
#
# Builds a code made of the first letter followed by digits derived from the
# remaining letters via SOUNDEX_CHARS / SOUNDEX_NUMS.
#
# @param census [Boolean] when true the digit part is limited to three
#   characters; when false it is left at full length. In both cases it is
#   right-padded with '0' to at least three characters.
# @return [String] the code, or '' if the digit part cannot be built (for
#   example when the receiver contains no letters)
def soundex(census = true)
  letters = upcase.delete(SOUNDEX_CHARS_DEL).squeeze
  last_index = census ? 2 : -1

  # Only this step is guarded, matching the scope of the original inline
  # rescue: with no letters, letters[1..-1] is nil and the chain raises.
  begin
    digits = letters[1..-1].delete(SOUNDEX_CHARS_EX).tr(SOUNDEX_CHARS, SOUNDEX_NUMS)
    # The digits are cut to length both before and after squeezing repeats.
    digits = digits[0..last_index].squeeze[0..last_index]
    letters[0..0] + digits.ljust(3, '0')
  rescue StandardError
    ''
  end
end

#sounds_like(other) ⇒ `Object`



36
37
38

# File 'lib/ndr_support/string/conversions.rb', line 36

# Compares this string with +other+ by their soundex codes.
#
# @param other [#soundex] the value to compare with; its +soundex+ is called
#   with the default argument
# @return [Boolean] true when both soundex codes are equal
def sounds_like(other)
  soundex == other.soundex
end

#squash ⇒ `Object`

Used for comparing addresses



21
22
23

# File 'lib/ndr_support/string/cleaning.rb', line 21

# Used for comparing addresses: upper-cases the string and then removes
# every character that is not A-Z or 0-9.
#
# @return [String]
def squash
  shouted = upcase
  shouted.delete('^A-Z0-9')
end

#strip_xml_unsafe_characters ⇒ `Object`



146
147
148

# File 'lib/ndr_support/string/cleaning.rb', line 146

# Returns a copy of the string with every character matching
# String::INVALID_CONTROL_CHARS removed.
#
# @return [String]
def strip_xml_unsafe_characters
  control_chars = String::INVALID_CONTROL_CHARS
  gsub(control_chars, '')
end

#surname_and_initials ⇒ `Object`

Convert “SMITH JD” into “Smith JD”

# File 'lib/ndr_support/string/conversions.rb', line 57

# Convert "SMITH JD" into "Smith JD".
#
# The string is split on whitespace; the last word is treated as the
# initials and kept verbatim, every preceding word is capitalized.
# A single-word string is treated as initials only, so the result keeps
# the separating space in front of it (e.g. "SMITH" gives " SMITH").
#
# @return [String] the reformatted name, or '' when the string contains no
#   words (empty or whitespace-only), which previously raised a TypeError
def surname_and_initials
  *surname_words, initials = split
  # No words at all: there are no initials to append.
  return '' if initials.nil?

  "#{surname_words.map(&:capitalize).join(' ')} #{initials}"
end

#surnameize ⇒ `Object`

Like titleize but copes with Scottish and Irish names.

# File 'lib/ndr_support/string/conversions.rb', line 64

# Like titleize but copes with Scottish and Irish names.
#
# When the first two characters (compared in upper case) are "MC" or "O'",
# the prefix and the remainder of the string are titleized separately and
# concatenated; any other string is simply titleized.
#
# @return [String]
def surnameize
  prefix = slice(0, 2).upcase
  return titleize unless %w[MC O'].include?(prefix)

  remainder = slice(2..-1)
  prefix.titleize + remainder.titleize
end

#thedate ⇒ `Object`



48
49
50

# File 'lib/ndr_support/string/conversions.rb', line 48

# Builds an Ourdate from this string and returns that object's +thedate+.
# NOTE(review): Ourdate is defined outside this file; presumably it parses
# the string as a date - confirm there.
def thedate
  Ourdate.new(self).thedate
end

#thetime ⇒ `Object`



52
53
54

# File 'lib/ndr_support/string/conversions.rb', line 52

# Builds an Ourtime from this string and returns that object's +thetime+.
# NOTE(review): Ourtime is defined outside this file; presumably it parses
# the string as a time - confirm there.
def thetime
  Ourtime.new(self).thetime
end

#to_boolean ⇒ `Object`

Try to convert the string value into boolean

# File 'lib/ndr_support/string/conversions.rb', line 143

# Try to convert the string value into boolean.
#
# Matching is case-insensitive. A String can never equal +true+/+false+ or
# be +nil+, so only the textual forms are checked.
#
# @return [Boolean] true for true/t/yes/y/1, false for false/f/no/n/0
# @raise [ArgumentError] when the string is none of the recognised values
def to_boolean
  # SECURE: BNS 2012-10-09: But may behave oddly for multi-line input
  # (the ^ and $ anchors match per line, so any matching line decides).
  return true if self =~ /^(true|t|yes|y|1)$/i
  return false if self =~ /^(false|f|no|n|0)$/i

  raise ArgumentError, "invalid value for Boolean: \"#{self}\""
end

#to_datetime ⇒ `Object`

# File 'lib/ndr_support/string/conversions.rb', line 130

# Converts the string to a DateTime, honouring ActiveRecord's configured
# default timezone.
#
# Default timezone for to_datetime conversion is GMT, not local timezone,
# so when ActiveRecord is configured with +:local+ the value is converted
# via +to_time+ instead; otherwise the aliased original implementation
# (+orig_to_datetime+) is used.
def to_datetime
  # Rails <= 6.1 only exposes the setting on ActiveRecord::Base.
  timezone_source = ActiveRecord.respond_to?(:default_timezone) ? ActiveRecord : ActiveRecord::Base

  if timezone_source.default_timezone == :local
    to_time.to_datetime
  else
    orig_to_datetime
  end
end

#truncate_hellip(n) ⇒ `Object`

Truncate a string, with an HTML ellipsis entity (&hellip;) at the end.



80
81
82

# File 'lib/ndr_support/string/conversions.rb', line 80

# Truncate a string, with an HTML &hellip; entity at the end.
#
# A string longer than +n+ characters is cut to its first +n - 1+
# characters and '&hellip;' is appended; shorter strings are returned
# unchanged (the same object).
#
# @param n [Integer] maximum number of characters to show, counting the
#   ellipsis as one
# @return [String]
def truncate_hellip(n)
  return self unless length > n

  # Clamp at zero: for n <= 0 a negative slice length would return nil and
  # the concatenation would raise; only the ellipsis is returned instead.
  kept = [n - 1, 0].max
  slice(0, kept) + '&hellip;'
end

#xml_unsafe? ⇒ `Boolean`

Returns:

(Boolean)



150
151
152

# File 'lib/ndr_support/string/cleaning.rb', line 150

# Tests whether the string contains any character matching
# String::INVALID_CONTROL_CHARS.
#
# @return [Integer, nil] truthy (the index of the first offending
#   character) when one is present, nil otherwise
def xml_unsafe?
  String::INVALID_CONTROL_CHARS =~ self
end

Class: String

Constant Summary collapse

Instance Method Summary collapse

Instance Method Details

#clean(what) ⇒ Object

#date1 ⇒ Object

#date2 ⇒ Object

#nhs_numberize ⇒ Object

#orig_to_datetime ⇒ Object

#postcodeize(option = :user) ⇒ Object

#soundex(census = true) ⇒ Object

#sounds_like(other) ⇒ Object

#squash ⇒ Object

#strip_xml_unsafe_characters ⇒ Object

#surname_and_initials ⇒ Object

#surnameize ⇒ Object

#thedate ⇒ Object

#thetime ⇒ Object

#to_boolean ⇒ Object

#to_datetime ⇒ Object

#truncate_hellip(n) ⇒ Object

#xml_unsafe? ⇒ Boolean