Class: Datahen::Client::ScraperJobPage

Inherits:
Base
  • Object
show all
Defined in:
lib/datahen/client/scraper_job_page.rb

Instance Method Summary collapse

Methods inherited from Base

#auth_token, #auth_token=, #env_api_url, env_auth_token, env_ignore_ssl, #ignore_ssl, #initialize

Constructor Details

This class inherits a constructor from Datahen::Client::Base

Instance Method Details

#all(scraper_name, opts = {}) ⇒ Object



8
9
10
11
# File 'lib/datahen/client/scraper_job_page.rb', line 8

def all(scraper_name, opts={})
  params = @options.merge(opts)
  self.class.get("/scrapers/#{scraper_name}/current_job/pages", params)
end

#enqueue(scraper_name, method, url, opts = {}) ⇒ Object



50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
# File 'lib/datahen/client/scraper_job_page.rb', line 50

def enqueue(scraper_name, method, url, opts={})
  body = {}
  body[:method] =  method != "" ? method : "GET"
  body[:url] =  url
  body[:page_type] = opts[:page_type] if opts[:page_type]
  body[:priority] = opts[:priority] if opts[:priority]
  body[:fetch_type] = opts[:fetch_type] if opts[:fetch_type]
  body[:body] = opts[:body] if opts[:body]
  body[:headers] = opts[:headers] if opts[:headers]
  body[:vars] = opts[:vars] if opts[:vars]
  body[:force_fetch] = opts[:force_fetch] if opts[:force_fetch]
  body[:freshness] = opts[:freshness] if opts[:freshness]
  body[:ua_type] = opts[:ua_type] if opts[:ua_type]
  body[:no_redirect] = opts[:no_redirect] if opts[:no_redirect]
  body[:cookie] = opts[:cookie] if opts[:cookie]
  body[:max_size] = opts[:max_size] if opts[:max_size]
  body[:enable_global_cache] = opts[:enable_global_cache] if opts.has_key?("enable_global_cache") || opts.has_key?(:enable_global_cache)
  body[:retry_interval] = opts[:retry_interval] if opts[:retry_interval]

  params = @options.merge({body: body.to_json})

  self.class.post("/scrapers/#{scraper_name}/current_job/pages", params)
end

#find(scraper_name, gid) ⇒ Object



4
5
6
# File 'lib/datahen/client/scraper_job_page.rb', line 4

def find(scraper_name, gid)
  self.class.get("/scrapers/#{scraper_name}/current_job/pages/#{gid}", @options)
end

#find_content(scraper_name, gid) ⇒ Object



74
75
76
# File 'lib/datahen/client/scraper_job_page.rb', line 74

def find_content(scraper_name, gid)
  self.class.get("/scrapers/#{scraper_name}/current_job/pages/#{gid}/content", @options)
end

#find_failed_content(scraper_name, gid) ⇒ Object



78
79
80
# File 'lib/datahen/client/scraper_job_page.rb', line 78

def find_failed_content(scraper_name, gid)
  self.class.get("/scrapers/#{scraper_name}/current_job/pages/#{gid}/failed_content", @options)
end

#limbo(scraper_name, opts = {}) ⇒ Object



45
46
47
48
# File 'lib/datahen/client/scraper_job_page.rb', line 45

def limbo(scraper_name, opts={})
  params = @options.merge(opts)
  self.class.put("/scrapers/#{scraper_name}/current_job/pages/limbo", params)
end

#refetch(scraper_name, opts = {}) ⇒ Object



27
28
29
30
# File 'lib/datahen/client/scraper_job_page.rb', line 27

def refetch(scraper_name, opts={})
  params = @options.merge(opts)
  self.class.put("/scrapers/#{scraper_name}/current_job/pages/refetch", params)
end

#refetch_by_job(job_id, opts = {}) ⇒ Object

Note:

This method will be removed at some point in the future.

Deprecated, please use Datahen::Client::JobPage#refetch instead.



35
36
37
38
# File 'lib/datahen/client/scraper_job_page.rb', line 35

def refetch_by_job(job_id, opts={})
  params = @options.merge(opts)
  self.class.put("/jobs/#{job_id}/pages/refetch", params)
end

#reparse(scraper_name, opts = {}) ⇒ Object



40
41
42
43
# File 'lib/datahen/client/scraper_job_page.rb', line 40

def reparse(scraper_name, opts={})
  params = @options.merge(opts)
  self.class.put("/scrapers/#{scraper_name}/current_job/pages/reparse", params)
end

#update(scraper_name, gid, opts = {}) ⇒ Object



13
14
15
16
17
18
19
20
21
22
23
24
25
# File 'lib/datahen/client/scraper_job_page.rb', line 13

def update(scraper_name, gid, opts={})
  body = {}
  body[:page_type] = opts[:page_type] if opts[:page_type]
  body[:priority] = opts[:priority] if opts[:priority]
  body[:vars] = opts[:vars] if opts[:vars]
  body[:max_size] = opts[:max_size] if opts[:max_size]
  body[:enable_global_cache] = opts[:enable_global_cache] if opts.has_key?("enable_global_cache") || opts.has_key?(:enable_global_cache)
  body[:retry_interval] = opts[:retry_interval] if opts[:retry_interval]

  params = @options.merge({body: body.to_json})

  self.class.put("/scrapers/#{scraper_name}/current_job/pages/#{gid}", params)
end