# frozen_string_literal: true

module Jobs
  # Scheduled job (declared with `every 1.hour`) that removes upload records
  # which nothing references any more.
  #
  # Each run:
  #   1. always destroys user uploads older than the grace period whose url is "";
  #   2. stops unless the `clean_up_uploads` site setting is enabled;
  #   3. stops if the previous full cleanup finished less than half a grace
  #      period ago;
  #   4. otherwise removes every orphaned upload and records the completion time.
  class CleanUpUploads < ::Jobs::Scheduled
    every 1.hour

    # Job entry point.
    #
    # @param args [Object] job arguments; not read by this job
    # @return [Object] not meaningful to callers (nil on an early exit)
    def execute(args)
      # The grace period is never allowed to drop below one hour.
      grace_period = [SiteSetting.clean_orphan_uploads_grace_period_hours, 1].max

      # Invalid upload records are removed even when orphan cleanup is disabled.
      destroy_invalid_uploads(grace_period)

      return unless SiteSetting.clean_up_uploads?
      return if cleaned_up_recently?(grace_period)

      orphaned_uploads(grace_period, ignored_upload_urls).find_each do |upload|
        remove_orphan(upload)
      end

      self.last_cleanup = Time.zone.now.to_i
    end

    # Records when the last full cleanup finished. The value is written to
    # Redis as a string with a 7 day expiry.
    #
    # @param v [#to_s] timestamp to store (execute passes epoch seconds)
    def last_cleanup=(v)
      Discourse.redis.setex(last_cleanup_key, 7.days.to_i, v.to_s)
    end

    # @return [Integer, nil] the stored timestamp converted with to_i, or nil
    #   when Redis returns nothing for the key
    def last_cleanup
      Discourse.redis.get(last_cleanup_key)&.to_i
    end

    # Deletes the stored timestamp so the next run is not throttled.
    def reset_last_cleanup!
      Discourse.redis.del(last_cleanup_key)
    end

    protected

    # @return [String] Redis key under which the last cleanup time is stored
    def last_cleanup_key
      "LAST_UPLOAD_CLEANUP"
    end

    private

    # Destroys user uploads with an empty url that are older than the grace
    # period and whose retain_hours window (if any) has elapsed.
    def destroy_invalid_uploads(grace_period)
      Upload
        .by_users
        .where("retain_hours IS NULL OR created_at < current_timestamp - interval '1 hour' * retain_hours")
        .where("created_at < ?", grace_period.hour.ago)
        .where(url: "")
        .find_each(&:destroy!)
    end

    # True when a previous full cleanup was recorded less than half a grace
    # period ago. `grace_period / 2` is evaluated before `.hours`, so with an
    # Integer grace period of 1 the window is 0 hours and nothing is throttled.
    def cleaned_up_recently?(grace_period)
      last_run = last_cleanup
      return false unless last_run

      (Time.zone.now.to_i - last_run) < (grace_period / 2).hours
    end

    # URLs listed in the `selectable_avatars` site setting, normalised so they
    # can be compared against `uploads.url`: the S3 CDN hostname is swapped for
    # the store hostname and anything before the store base URL is dropped.
    # Blank entries and entries that do not contain the base URL are skipped.
    #
    # @return [Array<String>] unique upload URLs that must never be removed
    def ignored_upload_urls
      store = Discourse.store
      base_url = store.internal? ? store.relative_base_url : store.absolute_base_url
      s3_hostname = URI.parse(base_url).hostname
      s3_cdn_hostname = URI.parse(SiteSetting.Upload.s3_cdn_url || "").hostname
      swap_cdn_host = s3_cdn_hostname.present? && s3_hostname.present?

      SiteSetting.selectable_avatars.split("\n").map do |url|
        next if url.blank?

        url = url.gsub(s3_cdn_hostname, s3_hostname) if swap_cdn_host
        start = url.index(base_url)
        start && url[start..-1]
      end.compact.uniq
    end

    # Relation of user uploads that are safe to remove. An upload qualifies when
    # it is older than the grace period, its retain_hours window (if any) has
    # elapsed, it has no access_control_post_id, its url is not in ignore_urls,
    # and no row references it from: upload-typed site settings, post_uploads,
    # users (avatar), user_avatars (gravatar/custom), user_profiles (profile and
    # card backgrounds), categories (logo/background), custom_emojis,
    # theme_fields, user_exports or groups (flair).
    #
    # Each reference check is a LEFT JOIN paired with an IS NULL condition, so
    # only uploads with no matching row survive.
    def orphaned_uploads(grace_period, ignore_urls)
      scope = Upload.by_users
        .where("uploads.retain_hours IS NULL OR uploads.created_at < current_timestamp - interval '1 hour' * uploads.retain_hours")
        .where("uploads.created_at < ?", grace_period.hour.ago)
        .where("uploads.access_control_post_id IS NULL")
        .joins(<<~SQL)
          LEFT JOIN site_settings ss
          ON NULLIF(ss.value, '')::integer = uploads.id
          AND ss.data_type = #{SiteSettings::TypeSupervisor.types[:upload].to_i}
        SQL
        .joins("LEFT JOIN post_uploads pu ON pu.upload_id = uploads.id")
        .joins("LEFT JOIN users u ON u.uploaded_avatar_id = uploads.id")
        .joins("LEFT JOIN user_avatars ua ON ua.gravatar_upload_id = uploads.id OR ua.custom_upload_id = uploads.id")
        .joins("LEFT JOIN user_profiles up ON up.profile_background_upload_id = uploads.id OR up.card_background_upload_id = uploads.id")
        .joins("LEFT JOIN categories c ON c.uploaded_logo_id = uploads.id OR c.uploaded_background_id = uploads.id")
        .joins("LEFT JOIN custom_emojis ce ON ce.upload_id = uploads.id")
        .joins("LEFT JOIN theme_fields tf ON tf.upload_id = uploads.id")
        .joins("LEFT JOIN user_exports ue ON ue.upload_id = uploads.id")
        .joins("LEFT JOIN groups g ON g.flair_upload_id = uploads.id")
        .where("pu.upload_id IS NULL")
        .where("u.uploaded_avatar_id IS NULL")
        .where("ua.gravatar_upload_id IS NULL AND ua.custom_upload_id IS NULL")
        .where("up.profile_background_upload_id IS NULL AND up.card_background_upload_id IS NULL")
        .where("c.uploaded_logo_id IS NULL AND c.uploaded_background_id IS NULL")
        .where("ce.upload_id IS NULL")
        .where("tf.upload_id IS NULL")
        .where("ue.upload_id IS NULL")
        .where("g.flair_upload_id IS NULL")
        .where("ss.value IS NULL")

      scope = scope.where("uploads.url NOT IN (?)", ignore_urls) if ignore_urls.present?
      scope
    end

    # Removes one orphan candidate. Uploads with a sha1 are destroyed unless
    # unpublished content still mentions them; uploads without a sha1 are
    # removed with `delete` instead of `destroy`.
    def remove_orphan(upload)
      if upload.sha1.present?
        upload.destroy unless referenced_by_unpublished_content?(upload)
      else
        upload.delete
      end
    end

    # True when a pending queued post or a draft contains the upload's sha1,
    # either verbatim or Base62-encoded. The LIKE patterns are passed as bind
    # parameters rather than interpolated into the SQL text.
    def referenced_by_unpublished_content?(upload)
      encoded_sha = Base62.encode(upload.sha1.hex)
      patterns = { sha1: "%#{upload.sha1}%", encoded_sha: "%#{encoded_sha}%" }

      ReviewableQueuedPost.pending.where("payload->>'raw' LIKE :sha1 OR payload->>'raw' LIKE :encoded_sha", patterns).exists? ||
        Draft.where("data LIKE :sha1 OR data LIKE :encoded_sha", patterns).exists?
    end
  end
end