Class: Glueckskeks::CorpusReader

Inherits:
Object
  • Object
show all
Defined in:
lib/glueckskeks/corpus_reader.rb

Class Method Summary collapse

Class Method Details

.read_corpus_files ⇒ Object



3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# File 'lib/glueckskeks/corpus_reader.rb', line 3

def self.read_corpus_files
  result_map = {}

  Dir.glob('corpus/*.corpus').each do |filename|
    Glueckskeks.logger.debug "Reading corpus file #{filename}"
    file = File.new(filename)

    lines = file.readlines

    lines.map!(&:strip!)
    lines.reject!(&:empty?)

    Glueckskeks.logger.debug "#{lines.count} valid line(s) found"
    result_map[File.basename(file, '.corpus')] = lines
  end

  result_map
end