Module: HTTP

Defined in:
lib/wiki_lyrics/utils/http.rb

Constant Summary collapse

@@user_agent =

@@user_agent = "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.0.2) Gecko/20060308 Firefox/1.5.0.2"

"Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1.9) Gecko/20071110 Firefox/2.0.0.9"
@@proxy_url =

@@user_agent = "Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.8.1.12) Gecko/20080218 Firefox/2.0.0.12"

nil
@@proxy_excluded_urls =
[]
@@proxy_reverse =

If true, the excluded_urls list is inverted: it becomes the list of the only URLs the proxy should be used for.

false

Class Method Summary collapse

Class Method Details

.fetch_page_get(url, headers = nil, follow = 10) ⇒ Object



94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
# File 'lib/wiki_lyrics/utils/http.rb', line 94

# Performs an HTTP(S) GET request for +url+, following redirects.
#
# url::     absolute URL to fetch
# headers:: optional Hash of extra request headers; its entries override the default
#           "User-Agent" and "Referer" headers (they are not forwarded to redirect targets)
# follow::  how many redirects may still be followed. At 0 a redirect counts as a
#           failure; with a negative value the redirect response itself is returned.
#
# Returns two values: the response (nil when the URL has no host/port/request path,
# the server did not answer with success, or a redirect could not be followed) and
# the last URL that was requested.
# Raises TimeoutError on connection timeouts and unexpectedly closed connections.
def HTTP.fetch_page_get( url, headers=nil, follow=10 )
	p_url = HTTP.parse_uri( url )
	return nil, url if p_url.host.nil? || p_url.port.nil? || p_url.request_uri.nil?
	proxy_host, proxy_port, proxy_user, proxy_pass = HTTP.get_url_proxy_settings( url )

	full_headers = {
		"User-Agent" => @@user_agent,
		"Referer" => "#{p_url.scheme}://#{p_url.host}",
	}
	full_headers.merge!( headers ) if headers

	http = Net::HTTP.new( p_url.host, p_url.port, proxy_host, proxy_port, proxy_user, proxy_pass )
	# without this an https URL would be spoken to in plain HTTP on port 443
	http.use_ssl = true if p_url.scheme == "https"
	response = http.request_get( p_url.request_uri, full_headers )

	case response
		when Net::HTTPSuccess
			# success: hand the response back untouched
		when Net::HTTPRedirection
			if follow == 0
				response = nil
			elsif follow > 0
				location = response["location"]
				if location
					# Location may be relative: resolve it against the URL just requested
					target = p_url.merge( HTTP.parse_uri( location ) ).to_s
					response, url = HTTP.fetch_page_get( target, nil, follow-1 )
				else
					# redirect-class answer without a target (e.g. 304): nothing to follow
					response = nil
				end
			end
		else
			response = nil
	end

	return response, url

rescue Errno::ETIMEDOUT, Errno::EBADF, EOFError => e
	# callers only deal with a single "connection failed" exception type
	raise TimeoutError.new( e.to_s )
end

.fetch_page_post(url, params, headers = nil, follow = 10) ⇒ Object



129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
# File 'lib/wiki_lyrics/utils/http.rb', line 129

# Performs an HTTP(S) POST of +params+ to +url+ as URL-encoded form data.
#
# url::     absolute URL to post to
# params::  form parameters, handed to URLEncodedFormData.prepare_query which yields
#           the request body and the matching base headers
# headers:: optional Hash of extra request headers; its entries override the prepared
#           headers as well as the default "User-Agent" and "Referer"
# follow::  how many redirects may still be followed. At 0 a redirect counts as a
#           failure; with a negative value the redirect response itself is returned.
#
# A redirect answer is followed with a GET request (HTTP.fetch_page_get).
#
# Returns two values: the response (nil when the URL has no host/port/request path,
# the server did not answer with success, or a redirect could not be followed) and
# the last URL that was requested.
# Raises TimeoutError on connection timeouts and unexpectedly closed connections.
def HTTP.fetch_page_post( url, params, headers=nil, follow=10 )
	p_url = HTTP.parse_uri( url )
	return nil, url if p_url.host.nil? || p_url.port.nil? || p_url.request_uri.nil?
	proxy_host, proxy_port, proxy_user, proxy_pass = HTTP.get_url_proxy_settings( url )

	data, full_headers = URLEncodedFormData.prepare_query( params )
	full_headers["User-Agent"] = @@user_agent
	full_headers["Referer"] = "#{p_url.scheme}://#{p_url.host}"
	full_headers.merge!( headers ) if headers

	http = Net::HTTP.new( p_url.host, p_url.port, proxy_host, proxy_port, proxy_user, proxy_pass )
	# without this an https URL would be spoken to in plain HTTP on port 443
	http.use_ssl = true if p_url.scheme == "https"
	response = http.request_post( p_url.request_uri, data, full_headers )

	case response
		when Net::HTTPSuccess
			# success: hand the response back untouched
		when Net::HTTPRedirection
			if follow == 0
				response = nil
			elsif follow > 0
				location = response["location"]
				if location
					# Location may be relative: resolve it against the URL just requested
					target = p_url.merge( HTTP.parse_uri( location ) ).to_s
					response, url = HTTP.fetch_page_get( target, nil, follow-1 )
				else
					# redirect-class answer without a target (e.g. 304): nothing to follow
					response = nil
				end
			end
		else
			response = nil
	end

	return response, url

rescue Errno::ETIMEDOUT, Errno::EBADF, EOFError => e
	# callers only deal with a single "connection failed" exception type
	raise TimeoutError.new( e.to_s )
end

.fetch_page_post_form_multipart(url, params, headers = nil, follow = 10) ⇒ Object



162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
# File 'lib/wiki_lyrics/utils/http.rb', line 162

# Performs an HTTP(S) POST of +params+ to +url+ as multipart form data.
#
# url::     absolute URL to post to
# params::  form parameters, handed to MultipartFormData.prepare_query which yields
#           the request body and the matching base headers
# headers:: optional Hash of extra request headers; its entries override the prepared
#           headers as well as the default "User-Agent" and "Referer"
# follow::  how many redirects may still be followed. At 0 a redirect counts as a
#           failure; with a negative value the redirect response itself is returned.
#
# A redirect answer is followed with a GET request (HTTP.fetch_page_get).
#
# Returns two values: the response (nil when the URL has no host/port/request path,
# the server did not answer with success, or a redirect could not be followed) and
# the last URL that was requested.
# Raises TimeoutError on connection timeouts and unexpectedly closed connections.
def HTTP.fetch_page_post_form_multipart( url, params, headers=nil, follow=10 )
	p_url = HTTP.parse_uri( url )
	return nil, url if p_url.host.nil? || p_url.port.nil? || p_url.request_uri.nil?
	proxy_host, proxy_port, proxy_user, proxy_pass = HTTP.get_url_proxy_settings( url )

	data, full_headers = MultipartFormData.prepare_query( params )
	full_headers["User-Agent"] = @@user_agent
	full_headers["Referer"] = "#{p_url.scheme}://#{p_url.host}"
	full_headers.merge!( headers ) if headers

	http = Net::HTTP.new( p_url.host, p_url.port, proxy_host, proxy_port, proxy_user, proxy_pass )
	# without this an https URL would be spoken to in plain HTTP on port 443
	http.use_ssl = true if p_url.scheme == "https"
	response = http.request_post( p_url.request_uri, data, full_headers )

	case response
		when Net::HTTPSuccess
			# success: hand the response back untouched
		when Net::HTTPRedirection
			if follow == 0
				response = nil
			elsif follow > 0
				location = response["location"]
				if location
					# Location may be relative: resolve it against the URL just requested
					target = p_url.merge( HTTP.parse_uri( location ) ).to_s
					response, url = HTTP.fetch_page_get( target, nil, follow-1 )
				else
					# redirect-class answer without a target (e.g. 304): nothing to follow
					response = nil
				end
			end
		else
			response = nil
	end

	return response, url

rescue Errno::ETIMEDOUT, Errno::EBADF, EOFError => e
	# callers only deal with a single "connection failed" exception type
	raise TimeoutError.new( e.to_s )
end

.get_proxy_settings ⇒ Object



56
57
58
59
60
# File 'lib/wiki_lyrics/utils/http.rb', line 56

# Returns a snapshot of the current proxy configuration as a three element array:
# the proxy URL (nil when none is set), the list of excluded URLs and the reverse flag.
# The URL strings are duplicated, so changing the returned values leaves the
# stored settings untouched.
def HTTP.get_proxy_settings()
	proxy_copy = nil
	proxy_copy = @@proxy_url.dup if @@proxy_url
	excluded_copy = @@proxy_excluded_urls.map { |excluded| excluded.dup }
	return proxy_copy, excluded_copy, @@proxy_reverse
end

.get_url_proxy_settings(url) ⇒ Object

Returns proxy_host, proxy_port, proxy_user and proxy_pass for the given url.



63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
# File 'lib/wiki_lyrics/utils/http.rb', line 63

# Works out which proxy, if any, applies to +url+.
#
# Returns four values: proxy host, port, user and password. All four are nil when
# no proxy is configured, when the configured proxy URL has no host, or when the
# exclusion list says this URL must not go through the proxy.
def HTTP.get_url_proxy_settings( url )
	no_proxy = [nil, nil, nil, nil]
	return no_proxy unless @@proxy_url

	proxy = HTTP.parse_uri( @@proxy_url )
	return no_proxy unless proxy.host
	proxy.port ||= 80

	# a URL is "listed" when it begins with one of the configured URL prefixes
	listed = @@proxy_excluded_urls.any? { |prefix| url.index( prefix ) == 0 }

	# normally listed URLs bypass the proxy; in reverse mode only listed URLs use it
	use_proxy = @@proxy_reverse ? listed : !listed
	return no_proxy unless use_proxy

	return proxy.host, proxy.port, proxy.user, proxy.password
end

.normalize_url(url, protocol = "http") ⇒ Object



34
35
36
37
38
39
40
41
42
# File 'lib/wiki_lyrics/utils/http.rb', line 34

# Brings +url+ into the canonical "protocol://rest" form without trailing slashes.
#
# url::      URL with or without a leading "protocol://" part
# protocol:: the only protocol accepted, also used as the prefix of the result
#
# Returns the normalized URL as a new string, or nil when +url+ names a protocol
# other than +protocol+. The string passed in is not modified.
def HTTP.normalize_url( url, protocol="http" )
	protocol_regexp = /^ *([^: ]+):\/+/
	trimmed = url.strip()

	found = protocol_regexp.match( trimmed )
	if found && found[1] != protocol
		return nil
	end

	# drop trailing slashes first, then any protocol part, keeping only the bare address
	bare = trimmed.gsub( /\/+$/, "" ).gsub( protocol_regexp, "" )
	return "#{protocol}://#{bare}"
end

.parse_uri(uri) ⇒ Object



86
87
88
89
90
91
92
# File 'lib/wiki_lyrics/utils/http.rb', line 86

# Parses +uri+ into a URI object.
#
# When the string is rejected as invalid (e.g. it contains characters that must be
# percent-encoded) it is escaped and parsed a second time.
#
# Returns the parsed URI.
# Raises URI::InvalidURIError when even the escaped form cannot be parsed.
def HTTP.parse_uri( uri )
	return URI.parse( uri )
rescue URI::InvalidURIError
	# URI.escape no longer exists on Ruby 3.0+; the parser object offers the same
	# escaping there, while very old rubies only know URI.escape
	escaped = defined?( URI::DEFAULT_PARSER ) ? URI::DEFAULT_PARSER.escape( uri ) : URI.escape( uri )
	return URI.parse( escaped )
end

.set_proxy_settings(proxy_url, excluded_urls = [], reverse = false) ⇒ Object



44
45
46
47
48
49
50
51
52
53
54
# File 'lib/wiki_lyrics/utils/http.rb', line 44

# Replaces the stored proxy configuration.
#
# proxy_url::     URL of the proxy, normalized to "http://..." form; nil (or a URL
#                 that normalize_url rejects) disables the proxy
# excluded_urls:: URLs to treat specially; each is normalized, entries that fail
#                 normalization and duplicates are dropped
# reverse::       stored as the reverse flag; forced to false when no proxy is set
#
# Without a usable proxy URL the exclusion list is left empty.
def HTTP.set_proxy_settings( proxy_url, excluded_urls=[], reverse=false )
	normalized_proxy = nil
	normalized_proxy = HTTP.normalize_url( proxy_url, "http" ) if proxy_url

	@@proxy_url = normalized_proxy
	@@proxy_reverse = normalized_proxy ? reverse : false
	@@proxy_excluded_urls = []
	return nil unless @@proxy_url

	excluded_urls.each() do |candidate|
		normalized = HTTP.normalize_url( candidate, "http" )
		next unless normalized
		next if @@proxy_excluded_urls.include?( normalized )
		@@proxy_excluded_urls << normalized
	end
end