Class: Roebe::DownloadFromThisUrl
- Inherits:
-
Base
show all
- Defined in:
- lib/roebe/classes/download_from_this_url.rb
Overview
Roebe::DownloadFromThisUrl
Constant Summary
collapse
- NON_GREEDY_REGEX_FOR_A_HREF_LINKS =
#
NON_GREEDY_REGEX_FOR_A_HREF_LINKS
See:
https://rubular.com/r/tsIqWtdx11QZmv
#
/<a href="(.+?)">?/
Constants inherited
from Base
Base::COLOURS, Base::HOME_DIRECTORY_OF_USER_X, Base::N, Base::NAMESPACE
Class Method Summary
collapse
-
.[](i = '') ⇒ Object
# === Roebe::DownloadFromThisUrl[] ========================================================================= #.
Instance Method Summary
collapse
Methods inherited from Base
#actions, #append_this_onto_that_file, #append_what_into, #be_silent, #be_verbose?, #beautiful_url, #burlywood, #call_next, #chdir, #cheerful_guy, #cliner, #complex_esystem, #convert_global_env, #copy_directory, #copy_file, #cornflowerblue, #create_directory, #crimson, #current_month?, #current_time?, #current_year?, #cyan, #darkcyan, #darkgreen, #darkkhaki, #darkslateblue, #deeppink, #delete_symlink, #do_not_use_the_base_colours, #do_use_the_base_colours, #e, #ecomment, #editor_to_use?, #efancy, #eimp, #emphasis, #ensure_main_encoding, #ensure_utf_encoding, #eparse, #erev, #esteelblue, #etomato, #ewarn, #exit_program, #firebrick, #get_current_day, #get_current_month, #get_files_and_directories, #get_files_from, #get_german_name_for_this_weekday, #gold, #green, #grey, #hh_mm_ss, #hh_mm_ss_day_month_year, #home_dir?, #home_directory_of_user_x?, #infer_the_namespace, #internal_hash?, #is_a_directory?, #is_a_file?, #is_a_jpg_file?, #is_an_image_file?, #is_archive?, #is_audio_file?, #is_in_studium_dir?, #is_multimedia_file?, #is_on_roebe?, #is_on_windows?, #is_studium_available?, #is_symlink?, #is_this_a_ruby_file?, #is_video_file?, #iso_encoding?, #le, #left_colour, #lightblue, #lightgreen, #lightseagreen, #lightsteelblue, #lime, #limegreen, #localhost_to_data, #log_directory?, #main_encoding?, #mediumorchid, #mediumpurple, #mediumseagreen, #mediumslateblue, #mediumspringgreen, #mediumturquoise, #mkdir_p, #mv, #n_days_in_this_month, #n_pages_in_this_pdf_file?, #namespace?, #no_file_exists_at, #ogrey, #olive, #olivedrab, #open_in_browser, #opne, #opnesystem, #opnn, #orange, #orchid, #orev, #palegoldenrod, #palevioletred, #pink, #powderblue, #programs_dir?, #project_base_dir?, #random_html_colour, #rds, #read_file_in_iso_encoding, #read_file_via_the_default_encoding, #read_lines_via_iso_encoding, #readlines_with_main_encoding, #red, #register_sigint, #remove, #remove_directory, #remove_file, #rename_kde_konsole_tab, #replace_localhost_with_data, #report_pwd, #require_rescue, #reset_the_internal_hash, #return_all_directories_from_this_directory, #return_all_files_from_this_directory, #return_current_directory, #return_dd_mm_yyyy, #return_file_or_directory_of, #return_files_from_pwd, #return_last_part_of_the_current_directory, #return_utc, #rev, #right_arrow?, #right_colour, #roebe_log_directory?, #rosybrown, #royalblue, #ruby_base_directory?, #run_in_background, #run_rcfiles_then_run_ata_via_qdbus, #sandybrown, #sdir, #seagreen, #set_be_verbose, #set_xorg_buffer, #sfancy, #sfile, #show_help, #silent_redirection?, #simp, #simple_esystem, #skyblue, #slateblue, #slategray, #springgreen, #steelblue, #string_italic, #swarn, #symlink, #teal, #temp_dir?, #to_camelcase, #to_counted_hash, #tomato, #touch, #try_to_require_the_beautiful_url_gem, #try_to_require_the_html_template, #try_to_require_the_open_gem, #try_to_require_the_program_information_gem, #try_to_require_the_xorg_buffer, #use_colours?, #verbose_truth, #weekday?, #word_wrap, #write_what_into, #yellow
#append_onto_the_commandline_arguments, #clear_commandline_arguments, #commandline_arguments?, #commandline_arguments_as_string?, #commandline_arguments_without_leading_hyphens?, #first_argument?, #first_argument_without_leading_hyphens?, #has_an_argument_been_passed?, #remove_hyphened_arguments_from_the_commandline_arguments, #return_commandline_arguments_with_leading_hyphens, #second_argument?, #set_commandline_arguments
Constructor Details
#initialize(use_this_url = nil, run_already = true) ⇒ DownloadFromThisUrl
43
44
45
46
47
48
49
50
51
52
53
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 43
def initialize(
use_this_url = nil,
run_already = true
)
reset
set_commandline_arguments(
use_this_url
)
set_url(use_this_url)
run if run_already
end
|
Class Method Details
.[](i = '') ⇒ Object
#
Roebe::DownloadFromThisUrl[]
#
257
258
259
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 257
def self.[](i = '')
new(i)
end
|
Instance Method Details
#do_filter(i) ⇒ Object
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 112
def do_filter(i)
use_this_filter = nil
if @filter_for
use_this_filter = @filter_for.map {|line|
'.'+line.to_s
}
end
if i.is_a?(Array) and use_this_filter
i.select! {|line| use_this_filter.any? {|this_filter|
line.include? this_filter
}
}
end
set_remote_dataset(i)
end
|
#download_these_files(i) ⇒ Object
#
download_these_files (download tag)
#
178
179
180
181
182
183
184
185
186
187
188
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 178
def download_these_files(i)
if i.is_a? Array
i.each {|this_file|
e "Now downloading #{sfile(this_file)}:"
from_this_resource = remote_base_url?+this_file
_ = "wget #{from_this_resource}"
e royalblue(" #{_}")
system _
}
end
end
|
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 233
def (
i = return_commandline_arguments_with_leading_hyphens
)
if i.is_a? Array
i.each {|entry| (entry) }
else
case i
when /^-?-?no(-|_| )?filters?$/i
@filter_for = nil
end
end
end
|
#obtain_all_entries_from_the_remote_website(i = url?
) ⇒ Object
#
obtain_all_entries_from_the_remote_website
#
217
218
219
220
221
222
223
224
225
226
227
228
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 217
def obtain_all_entries_from_the_remote_website(
i = url?
)
e 'Reading all entries from `'+sfancy(i)+'` next.'
begin
@remote_dataset = URI.open(i).read
rescue Net::FTPPermError => error e 'Net::FTPPermError occurred:'
pp error
@remote_dataset = nil
end
end
|
#remote_base_url? ⇒ Boolean
136
137
138
139
140
141
142
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 136
def remote_base_url?
_ = @url
unless _.end_with? '/'
_ = _[0 .. _.rindex('/')]
end
_
end
|
#remote_dataset? ⇒ Boolean
Also known as:
main_dataset?
82
83
84
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 82
def remote_dataset?
@remote_dataset
end
|
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 58
def reset
super()
@remote_dataset = nil @filter_for = [
:pdf,
:csv,
:gz,
:txt,
:bz2,
:"tar.bz2",
:"tar.gz",
:"tar.xz"
] end
|
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 193
def run
obtain_all_entries_from_the_remote_website
if @remote_dataset
scanned = @remote_dataset.scan(/<a href=".+"/)
if @filter_for
e 'We will filter for these file types: '+
royalblue(
@filter_for.join(', ')
)
do_filter(scanned)
end
scan_for_proper_entries
end
end
|
#scan_for_proper_entries ⇒ Object
#
scan_for_proper_entries
#
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 147
def scan_for_proper_entries
_ = main_dataset?
scanned = _.map {|line|
line.scan(NON_GREEDY_REGEX_FOR_A_HREF_LINKS).flatten }.flatten
if scanned.empty?
e tomato('No files were found that fit.')
e 'The regex we used for this scan was: '+sfancy(regex?)
e
e 'The main dataset was:'
cliner
pp _
cliner
else
download_these_files(scanned)
end
end
|
#set_remote_dataset(i) ⇒ Object
105
106
107
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 105
def set_remote_dataset(i)
@remote_dataset = i
end
|
#set_url(i = '') ⇒ Object
89
90
91
92
93
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 89
def set_url(i = '')
i = i.first if i.is_a? Array
i = i.to_s.dup
@url = i
end
|
#url? ⇒ Boolean
98
99
100
|
# File 'lib/roebe/classes/download_from_this_url.rb', line 98
def url?
@url
end
|