Method List
-
#== Wgit::Document
-
#[] Wgit::Document
-
#absolute? Wgit::Url
-
#adapter_response Wgit::Response
-
#add_total_time Wgit::Response
-
#assert_arr_types Wgit::Assertable
-
#assert_required_keys Wgit::Assertable
-
#assert_respond_to Wgit::Assertable
-
#assert_types Wgit::Assertable
-
#at_css Wgit::Document
-
#at_xpath Wgit::Document
-
#base_url Wgit::Document
-
#body Wgit::Response
-
#body_or_nil Wgit::Response
-
#browser_get Wgit::Crawler
-
#clear_db Wgit::Database
-
#clear_db! Wgit::DSL
-
#clear_docs Wgit::Database
-
#clear_urls Wgit::Database
-
#client Wgit::Database
-
common_insert_data Wgit::Model
-
common_update_data Wgit::Model
-
#concat Wgit::Url
-
connect Wgit::Database
-
#connection_string Wgit::DSL
-
#connection_string Wgit::Database
-
#crawl Wgit::DSL
-
#crawl_duration Wgit::Url
-
#crawl_site Wgit::Crawler
-
#crawl_site Wgit::DSL
-
#crawl_url Wgit::Crawler
-
#crawl_urls Wgit::Crawler
-
#crawled Wgit::Url
-
#crawled_urls Wgit::Database
-
#crawler Wgit::DSL
-
#crawler Wgit::Indexer
-
#create_collections Wgit::Database
-
#create_unique_indexes Wgit::Database
-
#css Wgit::Document
-
#date_crawled Wgit::Url
-
#db Wgit::Indexer
-
default_logger Wgit
-
define_extractor Wgit::Document
-
#delete Wgit::Database
-
#doc? Wgit::Database
-
#docs Wgit::Database
-
document Wgit::Model
-
each Wgit::Utils
-
#empty? Wgit::Document
-
#encode Wgit::Crawler
-
establish_connection Wgit::Database
-
#exists? Wgit::Database
-
#external_links Wgit::Document
-
#extract Wgit::Document
-
#extract Wgit::DSL
-
#extract_from_html Wgit::Document
-
#extract_from_object Wgit::Document
-
extractors Wgit::Document
-
#failure? Wgit::Response
-
#fetch Wgit::Crawler
-
fetch Wgit::Utils
-
#follow Wgit::DSL
-
format_sentence_length Wgit::Utils
-
#fragment? Wgit::Url
-
#get Wgit::Database
-
#get_browser_response Wgit::Crawler
-
#get_http_response Wgit::Crawler
-
#headers Wgit::Response
-
#html Wgit::Document
-
#http_get Wgit::Crawler
-
#index Wgit::DSL
-
#index? Wgit::Url
-
#index_site Wgit::Indexer
-
#index_site Wgit::DSL
-
#index_url Wgit::Indexer
-
#index_urls Wgit::Indexer
-
#index_www Wgit::Indexer
-
#index_www Wgit::DSL
-
#init_nokogiri Wgit::Document
-
#initialize Wgit::Crawler
-
#initialize Wgit::Database
-
#initialize Wgit::Url
-
#initialize Wgit::Response
-
#initialize Wgit::Document
-
#initialize Wgit::Indexer
-
#insert Wgit::Database
-
#inspect Wgit::Document
-
#inspect Wgit::Url
-
#internal_absolute_links Wgit::Document
-
#internal_links Wgit::Document
-
#invalid? Wgit::Url
-
#ip_address Wgit::Response
-
#keep_crawling? Wgit::Indexer
-
#last_response Wgit::DSL
-
#last_response Wgit::Crawler
-
#last_result Wgit::Database
-
logger Wgit
-
logger= Wgit
-
#make_absolute Wgit::Url
-
mode Wgit::Base
-
#next_internal_links Wgit::Crawler
-
#normalize Wgit::Url
-
#not_found? Wgit::Response
-
#num_docs Wgit::Database
-
#num_records Wgit::Database
-
#num_urls Wgit::Database
-
#ok? Wgit::Response
-
#omit Wgit::Url
-
#omit_base Wgit::Url
-
#omit_fragment Wgit::Url
-
#omit_leading_slash Wgit::Url
-
#omit_origin Wgit::Url
-
#omit_query Wgit::Url
-
#omit_slashes Wgit::Url
-
#omit_trailing_slash Wgit::Url
-
parse Wgit::Url
-
parse? Wgit::Url
-
#parse_javascript Wgit::Crawler
-
#parse_javascript_delay Wgit::Crawler
-
#parser Wgit::Document
-
#prefix_scheme Wgit::Url
-
printf_search_results Wgit::Utils
-
#query? Wgit::Url
-
#redirect? Wgit::Response
-
#redirect_count Wgit::Response
-
#redirect_limit Wgit::Crawler
-
#redirections Wgit::Response
-
#relative? Wgit::Url
-
remove_extractor Wgit::Document
-
remove_extractors Wgit::Document
-
#replace Wgit::Url
-
#reset Wgit::DSL
-
#resolve Wgit::Crawler
-
run Wgit::Base
-
sanitize Wgit::Utils
-
sanitize_arr Wgit::Utils
-
sanitize_str Wgit::Utils
-
#scheme_relative? Wgit::Url
-
#score Wgit::Document
-
#search Wgit::Document
-
#search Wgit::Database
-
#search Wgit::DSL
-
#search! Wgit::Document
-
#search! Wgit::Database
-
#search_text Wgit::Database
-
select_bson_types Wgit::Model
-
#setup Wgit::Base
-
#size Wgit::Response
-
#size Wgit::Document
-
#size Wgit::Database
-
#start Wgit::DSL
-
#stats Wgit::Database
-
#stats Wgit::Document
-
#status Wgit::Response
-
#success? Wgit::Response
-
supported_file_extensions Wgit::Crawler
-
#teardown Wgit::Base
-
text_elements Wgit::Document
-
text_elements_xpath Wgit::Document
-
#text_index Wgit::Database
-
time_stamp Wgit::Utils
-
#timeout Wgit::Crawler
-
#to_addressable_uri Wgit::Url
-
#to_base Wgit::Url
-
#to_brand Wgit::Url
-
#to_domain Wgit::Url
-
#to_endpoint Wgit::Url
-
#to_extension Wgit::Url
-
#to_fragment Wgit::Url
-
to_h Wgit::Utils
-
#to_h Wgit::Url
-
#to_h Wgit::Document
-
#to_host Wgit::Url
-
#to_json Wgit::Document
-
#to_origin Wgit::Url
-
#to_password Wgit::Url
-
#to_path Wgit::Url
-
#to_port Wgit::Url
-
#to_query Wgit::Url
-
#to_query_hash Wgit::Url
-
#to_scheme Wgit::Url
-
#to_sub_domain Wgit::Url
-
#to_uri Wgit::Url
-
#to_url String
-
#to_url Wgit::Url
-
#to_urls Enumerable
-
#to_urls! Enumerable
-
#to_user Wgit::Url
-
#total_time Wgit::Response
-
#uncrawled_urls Wgit::Database
-
#update Wgit::Database
-
#upsert Wgit::Database
-
url Wgit::Model
-
#url Wgit::Response
-
#url Wgit::Document
-
#url? Wgit::Database
-
#urls Wgit::Database
-
use_default_logger Wgit
-
#valid? Wgit::Url
-
version Wgit
-
version_str Wgit
-
#write_doc_to_db Wgit::Indexer
-
#write_urls_to_db Wgit::Indexer
-
#xpath Wgit::Document