Class: Ebooks::Archive

Inherits:
Object
  • Object
show all
Defined in:
lib/twitter_ebooks/archive.rb

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(username, path = nil, client = nil) ⇒ Archive

Returns a new instance of Archive.



42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
# File 'lib/twitter_ebooks/archive.rb', line 42

def initialize(username, path=nil, client=nil)
  @username = username
  @path = path || "corpus/#{username}.json"

  if File.directory?(@path)
    @path = File.join(@path, "#{username}.json")
  end

  @client = client || make_client

  if File.exists?(@path)
    @filetext = File.read(@path, :encoding => 'utf-8')
    @tweets = JSON.parse(@filetext, symbolize_names: true)
    log "Currently #{@tweets.length} tweets for #{@username}"
  else
    @tweets.nil?
    log "New archive for @#{username} at #{@path}"
  end
end

Instance Attribute Details

#tweetsObject (readonly)

Returns the value of attribute tweets.



11
12
13
# File 'lib/twitter_ebooks/archive.rb', line 11

def tweets
  @tweets
end

Instance Method Details

#make_clientObject



13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
# File 'lib/twitter_ebooks/archive.rb', line 13

def make_client
  if File.exists?(CONFIG_PATH)
    @config = JSON.parse(File.read(CONFIG_PATH), symbolize_names: true)
  else
    @config = {}

    puts "As Twitter no longer allows anonymous API access, you'll need to enter the auth details of any account to use for archiving. These will be stored in #{CONFIG_PATH} if you need to change them later."
    print "Consumer key: "
    @config[:consumer_key] = STDIN.gets.chomp
    print "Consumer secret: "
    @config[:consumer_secret] = STDIN.gets.chomp
    print "Access token: "
    @config[:oauth_token] = STDIN.gets.chomp
    print "Access secret: "
    @config[:oauth_token_secret] = STDIN.gets.chomp

    File.open(CONFIG_PATH, 'w') do |f|
      f.write(JSON.pretty_generate(@config))
    end
  end

  Twitter::REST::Client.new do |config|
    config.consumer_key = @config[:consumer_key]
    config.consumer_secret = @config[:consumer_secret]
    config.access_token = @config[:oauth_token]
    config.access_token_secret = @config[:oauth_token_secret]
  end
end

#syncObject



62
63
64
65
66
67
68
69
70
71
72
73
74
75
# File 'lib/twitter_ebooks/archive.rb', line 62

def sync
  # We use this structure to ensure that
  # a) if there's an issue opening the file, we error out before download
  # b) if there's an issue during download we restore the original
  File.open(@path, 'w') do |file|
    begin
      sync_to(file)
    rescue Exception
      file.seek(0)
      file.write(@filetext)
      raise
    end
  end
end

#sync_to(file) ⇒ Object



77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
# File 'lib/twitter_ebooks/archive.rb', line 77

def sync_to(file)
  retries = 0
  tweets = []
  max_id = nil

  opts = {
    count: 200,
    #include_rts: false,
    trim_user: true
  }

  opts[:since_id] = @tweets[0][:id] unless @tweets.nil?

  loop do
    opts[:max_id] = max_id unless max_id.nil?
    begin
      new = @client.user_timeline(@username, opts)
    rescue Twitter::Error::TooManyRequests
      log "Rate limit exceeded. Waiting for 5 mins before retry."
      sleep 60*5
      retry
    end
    break if new.length <= 1
    tweets += new
    log "Received #{tweets.length} new tweets"
    max_id = new.last.id
  end

  if tweets.length == 0
    log "No new tweets"
  else
    @tweets ||= []
    @tweets = tweets.map(&:attrs).each { |tw|
      tw.delete(:entities)
    } + @tweets
  end
  file.write(JSON.pretty_generate(@tweets))
end