Class: NSAStorage::Crawl

Inherits:
Object
  • Object
show all
Defined in:
lib/nsastorage/crawl.rb

Overview

Handles the crawl command via CLI.

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(stdout: $stdout, stderr: $stderr, options: {}) ⇒ Crawl

Returns a new instance of Crawl.

Parameters:

  • stdout (IO) (defaults to: $stdout)

    optional

  • stderr (IO) (defaults to: $stderr)

    optional

  • options (Hash) (defaults to: {})

    optional



13
14
15
16
17
# File 'lib/nsastorage/crawl.rb', line 13

def initialize(stdout: $stdout, stderr: $stderr, options: {})
  @stdout = stdout
  @stderr = stderr
  @options = options
end

Class Method Details

.runObject



6
7
8
# File 'lib/nsastorage/crawl.rb', line 6

def self.run(...)
  new(...).run
end

Instance Method Details

#process(url:) ⇒ Object



27
28
29
30
31
32
33
34
35
# File 'lib/nsastorage/crawl.rb', line 27

def process(url:)
  @stdout.puts(url)
  facility = Facility.fetch(url: url)
  @stdout.puts(facility.text)
  facility.prices.each { |price| @stdout.puts(price.text) }
  @stdout.puts
rescue FetchError => e
  @stderr.puts("url=#{url} error=#{e.message}")
end

#runObject



19
20
21
22
23
24
25
# File 'lib/nsastorage/crawl.rb', line 19

def run
  sitemap = Facility.sitemap
  @stdout.puts("count=#{sitemap.links.count}")
  @stdout.puts

  sitemap.links.each { |link| process(url: link.loc) }
end