Class: Onebox::Engine::WhitelistedGenericOnebox
Constant Summary
DEFAULT
Instance Attribute Summary
#cache, #timeout, #uri, #url
Class Method Summary
collapse
Instance Method Summary
collapse
#layout, max_text
add_oembed_provider, add_opengraph_provider, #always_https?, oembed_providers, opengraph_providers, #raw
engines, included, #initialize, #options, #options=
Class Method Details
.===(other) ⇒ Object
180
181
182
183
184
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 180
def self.===(other)
other.kind_of?(URI) ?
host_matches(other, whitelist) || probable_wordpress(other) || probable_discourse(other) :
super
end
|
.default_html_providers ⇒ Object
Often using the html attribute is not what we want, like for some blogs that include the entire page HTML. However for some providers like Flickr it allows us to return gifv and galleries.
143
144
145
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 143
def self.default_html_providers
['Flickr', 'Meetup']
end
|
.default_whitelist ⇒ Object
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 18
def self.default_whitelist
%w(
23hq.com
500px.com
8tracks.com
abc.net.au
about.com
answers.com
arstechnica.com
ask.com
battle.net
bbc.co.uk
bbs.boingboing.net
bestbuy.ca
bestbuy.com
blip.tv
bloomberg.com
businessinsider.com
change.org
clikthrough.com
cnet.com
cnn.com
codepen.io
collegehumor.com
consider.it
coursera.org
cracked.com
dailymail.co.uk
dailymotion.com
deadline.com
dell.com
deviantart.com
digg.com
dotsub.com
ebay.ca
ebay.co.uk
ebay.com
ehow.com
espn.go.com
etsy.com
findery.com
folksy.com
forbes.com
foxnews.com
funnyordie.com
gfycat.com
gifs.com
groupon.com
howtogeek.com
huffingtonpost.ca
huffingtonpost.com
hulu.com
ign.com
ikea.com
imdb.com
indiatimes.com
instagr.am
instagram.com
itunes.apple.com
khanacademy.org
kickstarter.com
kinomap.com
lessonplanet.com
liveleak.com
livestream.com
mashable.com
medium.com
meetup.com
mixcloud.com
mlb.com
myshopify.com
myspace.com
nba.com
npr.org
nytimes.com
photobucket.com
pinterest.com
reference.com
revision3.com
rottentomatoes.com
samsung.com
screenr.com
scribd.com
slideshare.net
sourceforge.net
speakerdeck.com
spotify.com
squidoo.com
streamable.com
techcrunch.com
ted.com
thefreedictionary.com
theglobeandmail.com
thenextweb.com
theonion.com
thestar.com
thesun.co.uk
thinkgeek.com
tmz.com
torontosun.com
tumblr.com
twitch.tv
twitpic.com
usatoday.com
viddler.com
videojug.com
vimeo.com
vine.co
walmart.com
washingtonpost.com
wi.st
wikia.com
wikihow.com
wired.com
wistia.com
wonderhowto.com
wsj.com
zappos.com
zillow.com
)
end
|
.host_matches(uri, list) ⇒ Object
168
169
170
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 168
def self.host_matches(uri, list)
!!list.find {|h| %r((^|\.)#{Regexp.escape(h)}$).match(uri.host) }
end
|
.html_providers ⇒ Object
147
148
149
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 147
def self.html_providers
@html_providers ||= default_html_providers.dup
end
|
.html_providers=(new_provs) ⇒ Object
151
152
153
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 151
def self.html_providers=(new_provs)
@html_providers = new_provs
end
|
.https_hosts ⇒ Object
164
165
166
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 164
def self.https_hosts
%w(slideshare.net dailymotion.com livestream.com)
end
|
.probable_discourse(uri) ⇒ Object
172
173
174
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 172
def self.probable_discourse(uri)
!!(uri.path =~ /\/t\/[^\/]+\/\d+(\/\d+)?(\?.*)?$/)
end
|
.probable_wordpress(uri) ⇒ Object
176
177
178
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 176
def self.probable_wordpress(uri)
!!(uri.path =~ /\d{4}\/\d{2}\//)
end
|
.rewrites ⇒ Object
A re-written URL converts http:// -> https://
156
157
158
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 156
def self.rewrites
@rewrites ||= https_hosts.dup
end
|
.rewrites=(new_list) ⇒ Object
160
161
162
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 160
def self.rewrites=(new_list)
@rewrites = new_list
end
|
.whitelist ⇒ Object
14
15
16
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 14
def self.whitelist
@whitelist ||= default_whitelist.dup
end
|
.whitelist=(list) ⇒ Object
10
11
12
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 10
def self.whitelist=(list)
@whitelist = list
end
|
Instance Method Details
#data ⇒ Object
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 197
def data
@data ||= begin
html_entities = HTMLEntities.new
d = { link: link }.merge(raw)
if !Onebox::Helpers.blank?(d[:title])
d[:title] = html_entities.decode(Onebox::Helpers.truncate(d[:title].strip, 80))
end
d[:description] ||= d[:summary]
if !Onebox::Helpers.blank?(d[:description])
d[:description] = html_entities.decode(Sanitize.fragment(Onebox::Helpers.truncate(d[:description].strip, 250)))
end
if !Onebox::Helpers.blank?(d[:domain])
d[:domain] = "http://#{d[:domain]}" unless d[:domain] =~ /^https?:\/\//
d[:domain] = URI(d[:domain]).host.to_s.sub(/^www\./, '') rescue nil
end
d[:image] = d[:image_secure_url] || d[:image_url] || d[:thumbnail_url] || d[:image]
d[:video] = d[:video_secure_url] || d[:video_url] || d[:video]
d
end
end
|
#placeholder_html ⇒ Object
190
191
192
193
194
195
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 190
def placeholder_html
return article_html if is_article?
return image_html if has_image? && (is_video? || is_image?)
return article_html if has_text? && is_embedded?
to_html
end
|
#to_html ⇒ Object
186
187
188
|
# File 'lib/onebox/engine/whitelisted_generic_onebox.rb', line 186
def to_html
rewrite_https(generic_html)
end
|