Class: Jobs::CleanUpUploads

Inherits:
Scheduled show all
Defined in:
app/jobs/scheduled/clean_up_uploads.rb

Instance Method Summary collapse

Methods inherited from Scheduled

#perform

Methods inherited from Base

acquire_cluster_concurrency_lock!, clear_cluster_concurrency_lock!, cluster_concurrency, cluster_concurrency_redis_key, delayed_perform, #error_context, get_cluster_concurrency, #last_db_duration, #log, #perform, #perform_immediately

Instance Method Details

#execute(args) ⇒ Object



7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
# File 'app/jobs/scheduled/clean_up_uploads.rb', line 7

def execute(args)
  grace_period = [SiteSetting.clean_orphan_uploads_grace_period_hours, 1].max

  # always remove invalid upload records
  Upload
    .by_users
    .where(
      "retain_hours IS NULL OR created_at < current_timestamp - interval '1 hour' * retain_hours",
    )
    .where("created_at < ?", grace_period.hour.ago)
    .where(url: "")
    .find_each(&:destroy!)

  return unless SiteSetting.clean_up_uploads?

  if c = last_cleanup
    return if (Time.zone.now.to_i - c) < (grace_period / 2).hours
  end

  base_url =
    (
      if Discourse.store.internal?
        Discourse.store.relative_base_url
      else
        Discourse.store.absolute_base_url
      end
    )
  s3_hostname = URI.parse(base_url).hostname
  s3_cdn_hostname = URI.parse(SiteSetting.Upload.s3_cdn_url || "").hostname

  result = Upload.by_users
  Upload.unused_callbacks&.each { |handler| result = handler.call(result) }
  result =
    result
      .where(
        "uploads.retain_hours IS NULL OR uploads.created_at < current_timestamp - interval '1 hour' * uploads.retain_hours",
      )
      .where("uploads.created_at < ?", grace_period.hour.ago)
      .where("uploads.access_control_post_id IS NULL")
      .joins("LEFT JOIN upload_references ON upload_references.upload_id = uploads.id")
      .where("upload_references.upload_id IS NULL")
      .with_no_non_post_relations

  result.find_each do |upload|
    next if Upload.in_use_callbacks&.any? { |callback| callback.call(upload) }

    if upload.sha1.present?
      # TODO: Remove this check after UploadReferences records were created
      encoded_sha = Base62.encode(upload.sha1.hex)
      if ReviewableQueuedPost
           .pending
           .where(
             "payload->>'raw' LIKE ? OR payload->>'raw' LIKE ?",
             "%#{upload.sha1}%",
             "%#{encoded_sha}%",
           )
           .exists?
        next
      end
      if Draft.where(
           "data LIKE ? OR data LIKE ?",
           "%#{upload.sha1}%",
           "%#{encoded_sha}%",
         ).exists?
        next
      end
      if UserProfile.where(
           "bio_raw LIKE ? OR bio_raw LIKE ?",
           "%#{upload.sha1}%",
           "%#{encoded_sha}%",
         ).exists?
        next
      end

      upload.destroy
    else
      upload.delete
    end
  end

  ExternalUploadStub.cleanup!

  self.last_cleanup = Time.zone.now.to_i
end

#last_cleanupObject



96
97
98
99
# File 'app/jobs/scheduled/clean_up_uploads.rb', line 96

def last_cleanup
  v = Discourse.redis.get(last_cleanup_key)
  v ? v.to_i : v
end

#last_cleanup=(v) ⇒ Object



92
93
94
# File 'app/jobs/scheduled/clean_up_uploads.rb', line 92

def last_cleanup=(v)
  Discourse.redis.setex(last_cleanup_key, 7.days.to_i, v.to_s)
end

#reset_last_cleanup!Object



101
102
103
# File 'app/jobs/scheduled/clean_up_uploads.rb', line 101

def reset_last_cleanup!
  Discourse.redis.del(last_cleanup_key)
end