Class: Query::Result::Baidu

Inherits:
Object
  • Object
show all
Includes:
Query::Result
Defined in:
lib/query/result/baidu.rb

Instance Attribute Summary

Attributes included from Query::Result

#baseuri, #pagenumber, #perpage

Instance Method Summary collapse

Methods included from Query::Result

#initialize, #next, #rank, #raw_ranks

Instance Method Details

#ads_bottom ⇒ Object



30
31
32
33
34
35
# File 'lib/query/result/baidu.rb', line 30

# Returns the ads reported for the bottom of the page.
#
# This currently just forwards to #ads_top, so both methods yield the same
# list. A dedicated lookup was written but is disabled; it searched
#   //*[@class='result']/following-sibling::*[contains(@class,'EC_result')]
# and passed each match to parse_ad.
#
# @return [Object] whatever #ads_top returns
def ads_bottom
  ads_top
end

#ads_left ⇒ Object

# Collects elements whose class contains 'EC_result' and which are preceding
# siblings of an element with class 'result', parses each with parse_ad and
# tags it with a 1-based :rank in document order.
#
# @return [Array] one parse_ad result per matched element, merged with :rank
#   (presumably Hashes, since #merge is called on them — verify against parse_ad)
def ads_top
  ad_nodes = @page.search("//*[@class='result']/preceding-sibling::*[contains(@class,'EC_result')]")
  ad_nodes.each_with_index.map do |node, position|
    parse_ad(node).merge(:rank => position + 1)
  end
end



18
19
20
21
22
# File 'lib/query/result/baidu.rb', line 18

# Parses every element under div#content_left whose class contains
# 'EC_result'. The XPath is evaluated with a MyFilter instance passed as the
# second argument to @page.xpath.
#
# No :rank is attached here (that merge is disabled); #ads_top assigns ranks
# after de-duplicating this list.
#
# @return [Array] one parse_ad result per matched element
def ads_left
  ad_nodes = @page.xpath("//div[@id='content_left']//*[contains(@class,'EC_result')]", MyFilter.new)
  ad_nodes.map { |node| parse_ad(node) }
end

#ads_right ⇒ Object



37
38
39
40
41
42
43
44
45
46
47
48
49
# File 'lib/query/result/baidu.rb', line 37

# Extracts the ads found under div#ec_im_container (each child div that has
# an id attribute).
#
# For every ad the first <a> supplies the text and href, and the first
# element with class 'EC_url' supplies the display URL, which is prefixed
# with "http://" so a host can be parsed out of it.
#
# @return [Array<Hash>] hashes with :rank (1-based), :text, :href and :host
def ads_right
  @page.search("//div[@id='ec_im_container']/div[@id]").each_with_index.map do |div, index|
    link = div.search('a').first
    display_url = "http://#{div.search("*[@class='EC_url']").first.text}"
    # URI.encode was removed in Ruby 3.0; DEFAULT_PARSER.escape is the call it
    # delegated to, so the escaping rules are unchanged.
    escaped_url = URI::DEFAULT_PARSER.escape(display_url)
    {
      :rank => index + 1,
      :text => link.text.strip,
      :href => link['href'].strip,
      :host => Addressable::URI.parse(escaped_url).host
    }
  end
end

#ads_top ⇒ Object



24
25
26
27
28
# File 'lib/query/result/baidu.rb', line 24

# Returns the left-column ads with duplicates removed, each tagged with a
# 1-based :rank reflecting its position in the de-duplicated list.
#
# @return [Array] the unique entries of #ads_left, each merged with :rank
def ads_top
  unique_ads = ads_left.uniq
  unique_ads.each_with_index.map { |ad, position| ad.merge(:rank => position + 1) }
end

#count ⇒ Object



51
52
53
# File 'lib/query/result/baidu.rb', line 51

# Reads the number shown in the first span with class 'nums': every non-digit
# character is stripped from its content and the remainder is converted with
# to_i. The value is memoized in @count once it is truthy.
#
# @return [Integer, nil] the parsed number, or nil when no such span exists
def count
  @count ||= begin
    totals = @page.search("//span[@class='nums']").map do |node|
      node.nil? ? nil : node.content.gsub(/\D/, '').to_i
    end
    totals.first
  end
end

#has_result? ⇒ Boolean

Returns:

  • (Boolean)


59
60
61
62
63
# File 'lib/query/result/baidu.rb', line 59

# Tells whether the page carries results.
#
# The page is treated as having no results when it contains a link whose text
# is "提交网址" ("submit URL") and whose href includes 'sitesubmit'.
#
# @return [Boolean] false when that link is present, true otherwise
def has_result?
  submit = @page.search('//a[text()="提交网址"]').first
  return true unless submit

  # to_s guards against an anchor that has no href attribute at all.
  !submit['href'].to_s.include?('sitesubmit')
end

#next_url ⇒ Object



65
66
67
68
69
# File 'lib/query/result/baidu.rb', line 65

# Looks up the link whose text is "下一页>" ("next page >").
#
# @return [String, false] the href of the first such link, or false when the
#   page has none
def next_url
  links = @page.search("//a[text()='下一页>']")
  links.empty? ? false : links.first['href']
end


55
56
57
# File 'lib/query/result/baidu.rb', line 55

# Returns the text of every link inside the table rows of div#rs. The list is
# memoized in @related_keywords.
#
# @return [Array] the text of each matched link
def related_keywords
  return @related_keywords if @related_keywords

  links = @page.search("//div[@id=\"rs\"]//tr//a")
  @related_keywords = links.map(&:text)
end

#seo_ranks ⇒ Object



5
6
7
8
9
10
# File 'lib/query/result/baidu.rb', line 5

# Returns the result entries of the page, each parsed with parse_seo and
# tagged with a 1-based :rank in document order.
#
# Entries are elements whose class attribute is exactly 'result',
# 'result-op', 'result-op c-container' or 'result c-container'.
#
# The list is cached in @ranks. The early return already expected a cached
# value, but nothing stored one, so the page was re-parsed on every call.
#
# @return [Array] one parse_seo result per matched element, merged with :rank
def seo_ranks
  return @ranks unless @ranks.nil?

  result_nodes = @page.search("//*[@class='result']|//*[@class='result-op']|//*[@class='result-op c-container']|//*[@class='result c-container']")
  @ranks = result_nodes.each_with_index.map do |node, index|
    parse_seo(node).merge(:rank => index + 1)
  end
end