Module: PreProcessor

Defined in:
lib/biodiversity/parser.rb

Constant Summary collapse

# Patterns that PreProcessor.clean strips from a name string.
# Each one is anchored to the end of a line.

# Whitespace followed by "species group", "species complex", "group" or
# "author" as a whole word, plus everything after it (case-insensitive).
NOTES =
/\s+(species\s+group|species\s+complex|group|author)\b.*$/i
# Whitespace followed by "sensu" or "auct" (with or without a trailing
# period), plus everything after it (case-insensitive).
TAXON_CONCEPTS1 =
/\s+(sensu\.|sensu|auct\.|auct)\b.*$/i
# Whitespace followed by "s. s.", "s. l.", "s. str.", "s. lat." (optionally
# preceded by "("), "sec", "sec." or "near", plus everything after it.
# Case-sensitive, unlike the other patterns.
# NOTE(review): `\b` right after an alternative ending in a literal "." only
# matches when a word character follows, so e.g. "s. l." followed by a space
# or end of line is not matched. Confirm whether that is intended.
TAXON_CONCEPTS2 =
/\s+(\(?s\.\s?s\.|\(?s\.\s?l\.|\(?s\.\s?str\.|\(?s\.\s?lat\.|sec\.|sec|near)\b.*$/
# Trailing "pro parte" or "p. p." / "p.p.", preceded by a comma or whitespace.
# The periods are escaped so that ordinary trailing words of the shape
# p?p? (e.g. "pipa", "papa") are not mistaken for the abbreviation.
TAXON_CONCEPTS3 =
/(,\s*|\s+)(pro parte|p\.\s?p\.)\s*$/i
# A comma or whitespace followed by "nomen", "nom." or "comb." (optionally
# preceded by "("), plus everything after it (case-insensitive).
NOMEN_CONCEPTS =
/(,\s*|\s+)(\(?nomen|\(?nom\.|\(?comb\.).*$/i
# A dangling final word from the list below, preceded by a comma or
# whitespace. "hort." uses an escaped period so that trailing words such as
# "horta" are left alone.
LAST_WORD_JUNK =
/(,\s*|\s+)(von|van|sensu|new|non|nec|cf|ssp|subsp|subgen|hybrid|hort\.|hort)\s*$/i

Class Method Summary collapse

Class Method Details

.clean(a_string) ⇒ Object



17
18
19
20
21
22
23
# File 'lib/biodiversity/parser.rb', line 17

# Strips annotation text from a name string and normalizes the long s.
#
# Each pattern is applied in turn with gsub, removing every match; the
# output of one pattern is the input of the next. Afterwards every
# 'ſ' character is replaced by 's'.
#
# @param a_string [String] the raw name string
# @return [String] a new string; the argument itself is not modified
def self.clean(a_string)
  patterns = [NOTES, TAXON_CONCEPTS1, TAXON_CONCEPTS2, TAXON_CONCEPTS3, NOMEN_CONCEPTS, LAST_WORD_JUNK]
  stripped = patterns.inject(a_string) { |text, pattern| text.gsub(pattern, '') }
  stripped.tr('ſ', 's') # old 's'
end