2013-10-14 08:27:41 -04:00
|
|
|
module Jobs

  # Scheduled job that destroys uploads which no other record references.
  class CleanUpUploads < Jobs::Scheduled
    every 1.hour

    # Destroys every upload that:
    #   * is past its own `retain_hours` window (when one is set),
    #   * is older than the orphan grace period (at least one hour),
    #   * has no matching row in any of the tables joined below,
    #   * is not one of the site-setting image URLs, and
    #   * has a sha1 that does not appear in any queued post or draft.
    #
    # Returns immediately when SiteSetting.clean_up_uploads? is falsy.
    #
    # @param args [Object] not used by this job
    def execute(args)
      return unless SiteSetting.clean_up_uploads?

      base_url = Discourse.store.internal? ? Discourse.store.relative_base_url : Discourse.store.absolute_base_url
      s3_hostname = URI.parse(base_url).hostname
      s3_cdn_hostname = URI.parse(SiteSetting.Upload.s3_cdn_url || "").hostname

      # Uploads whose URL is referenced by one of these site settings are
      # excluded from deletion (see the NOT IN clause further down).
      ignore_urls = [
        SiteSetting.logo_url,
        SiteSetting.logo_small_url,
        SiteSetting.favicon_url,
        SiteSetting.apple_touch_icon_url,
      ].map do |url|
        next if url.blank?

        # Work on a copy: gsub! below mutates the string in place.
        url = url.dup

        # Rewrite the CDN hostname to the store hostname so the setting can
        # be compared against the URL kept on the upload record.
        if s3_cdn_hostname.present? && s3_hostname.present?
          url.gsub!(s3_cdn_hostname, s3_hostname)
        end

        # Keep only the part starting at base_url; settings that do not
        # contain base_url yield nil and are dropped by `compact`.
        url[base_url] && url[url.index(base_url)..-1]
      end.compact.uniq

      # Never use a grace period shorter than one hour.
      grace_period = [SiteSetting.clean_orphan_uploads_grace_period_hours, 1].max

      # LEFT JOIN every referencing table, then keep only the uploads for
      # which each join found nothing.
      result = Upload.where("uploads.retain_hours IS NULL OR uploads.created_at < current_timestamp - interval '1 hour' * uploads.retain_hours")
        .where("uploads.created_at < ?", grace_period.hour.ago)
        .joins("LEFT JOIN post_uploads pu ON pu.upload_id = uploads.id")
        .joins("LEFT JOIN users u ON u.uploaded_avatar_id = uploads.id")
        .joins("LEFT JOIN user_avatars ua ON ua.gravatar_upload_id = uploads.id OR ua.custom_upload_id = uploads.id")
        .joins("LEFT JOIN user_profiles up ON up.profile_background = uploads.url OR up.card_background = uploads.url")
        .joins("LEFT JOIN categories c ON c.uploaded_logo_id = uploads.id OR c.uploaded_background_id = uploads.id")
        .joins("LEFT JOIN custom_emojis ce ON ce.upload_id = uploads.id")
        .joins("LEFT JOIN theme_fields tf ON tf.upload_id = uploads.id")
        .where("pu.upload_id IS NULL")
        .where("u.uploaded_avatar_id IS NULL")
        .where("ua.gravatar_upload_id IS NULL AND ua.custom_upload_id IS NULL")
        .where("up.profile_background IS NULL AND up.card_background IS NULL")
        .where("c.uploaded_logo_id IS NULL AND c.uploaded_background_id IS NULL")
        .where("ce.upload_id IS NULL")
        .where("tf.upload_id IS NULL")

      result = result.where("uploads.url NOT IN (?)", ignore_urls) if ignore_urls.present?

      result.find_each do |upload|
        if upload.sha1.present?
          encoded_sha = Base62.encode(upload.sha1.hex)

          # Skip uploads whose sha1 (hex or Base62-encoded) still appears in
          # a queued post or a draft. The patterns are passed as bind
          # parameters rather than interpolated into the SQL string.
          sha_patterns = ["%#{upload.sha1}%", "%#{encoded_sha}%"]
          next if QueuedPost.where("raw LIKE ? OR raw LIKE ?", *sha_patterns).exists?
          next if Draft.where("data LIKE ? OR data LIKE ?", *sha_patterns).exists?
        end

        upload.destroy
      end
    end

  end

end
|