Method: Apollo::Crawler::GoogleCrawler#extract_data

Defined in:
lib/apollo_crawler/crawler/google_crawler.rb

#extract_data(doc) ⇒ Object



36
37
38
39
40
41
42
43
44
45
46
# File 'lib/apollo_crawler/crawler/google_crawler.rb', line 36

# Extracts link entries from a parsed document.
#
# Every node matched by the @@MATCHER_ITEM XPath expression is turned into a
# hash holding the node's text and the URL derived from its 'href' attribute.
# Nodes for which BaseCrawler.try_get_url returns nil are omitted from the
# result, so the returned array never contains nil entries.
#
# @param doc [#xpath] parsed document to search
#   (presumably a Nokogiri document -- confirm against the caller)
# @return [Array<Hash>] one hash per usable node, of the form
#   { :text => <node text>, :link => <url> }
def extract_data(doc)
	doc.xpath(@@MATCHER_ITEM).map { |node|
		# NOTE(review): try_get_url presumably resolves the href against this
		# crawler's own url; its exact semantics are not visible here.
		url = BaseCrawler.try_get_url(self.url, node['href'])

		# `next` inside map yields nil for this element; the trailing
		# `compact` is what actually removes it from the result.
		next if url.nil?

		{
			:text => node.text,
			:link => url
		}
	}.compact
end