|
|
|
@ -44,6 +44,83 @@ module Mastodon |
|
|
|
|
say("Removed #{processed} media attachments (approx. #{number_to_human_size(aggregate)}) #{dry_run}", :green, true) |
|
|
|
|
end |
|
|
|
|
|
|
|
|
|
# Options for the `remove-orphans` command:
#   --start-after  storage key to resume the listing after (read by the S3 branch only)
#   --dry-run      count and log orphans without deleting anything
option :start_after, type: :string
option :dry_run, type: :boolean, default: false
desc 'remove-orphans', 'Scan storage and check for files that do not belong to existing media attachments'
long_desc <<~LONG_DESC
  Scans file storage for files that do not belong to existing media attachments. Because this operation
  requires iterating over every single file individually, it will be slow.

  Please mind that some storage providers charge for the necessary API requests to list objects.
LONG_DESC
# Removes stored files under `media_attachments/files` that no MediaAttachment
# record accounts for, then prints how many were removed and their combined size.
#
# A file counts as an orphan when no MediaAttachment exists for the ID parsed
# from its path, or when that record's `variant?` returns false for the file name.
#
# Behaviour depends on the configured Paperclip storage:
# - :s3         lists the bucket in pages of up to 1000 objects, starting after
#               `--start-after` when it is given
# - :fog        not supported; prints an error and exits with status 1
# - :filesystem walks the directory tree with `Find.find`
#
# With `--dry-run` nothing is deleted; orphans are still counted and logged.
def remove_orphans
  progress        = create_progress_bar(nil)
  reclaimed_bytes = 0
  removed         = 0
  dry_run         = options[:dry_run] ? ' (DRY RUN)' : ''

  # Joins every path segment between the first two and the file name, then lets
  # `to_i` read the leading digits. Presumably those segments are the zero-padded
  # ID partition followed by the style directory -- TODO confirm against the
  # Paperclip path template.
  attachment_id_for = ->(segments) { segments[2..-2].join.to_i }

  # Shared orphan test for both storage branches.
  orphan = ->(attachment, filename) { attachment.nil? || !attachment.variant?(filename) }

  case Paperclip::Attachment.default_options[:storage]
  when :s3
    paperclip_instance = MediaAttachment.new.file
    s3_interface       = paperclip_instance.s3_interface
    bucket             = s3_interface.bucket(Paperclip::Attachment.default_options[:s3_credentials][:bucket])
    last_key           = options[:start_after]

    loop do
      objects = bucket.objects(start_after: last_key, prefix: 'media_attachments/files/').limit(1000).to_a

      break if objects.empty?

      # Remember where this page ended so the next request continues after it.
      last_key = objects.last.key

      # One query per page instead of one per object.
      page_ids        = objects.map { |object| attachment_id_for.call(object.key.split('/')) }
      attachments_map = MediaAttachment.where(id: page_ids).index_by(&:id)

      objects.each do |object|
        segments      = object.key.split('/')
        attachment_id = attachment_id_for.call(segments)
        filename      = segments.last

        progress.increment

        next unless orphan.call(attachments_map[attachment_id], filename)

        reclaimed_bytes += object.size
        removed += 1
        object.delete unless options[:dry_run]
        progress.log("Found and removed orphan: #{object.key}#{dry_run}")
      end
    end
  when :fog
    say('The fog storage driver is not supported for this operation at this time', :red)
    exit(1)
  when :filesystem
    require 'find'

    # NOTE(review): PAPERCLIP_ROOT_PATH is believed to be the variable the
    # application's Paperclip configuration reads for the storage root -- confirm.
    # RAILS_ROOT_PATH is still honoured so existing invocations keep working.
    configured_root = ENV['PAPERCLIP_ROOT_PATH'] || ENV['RAILS_ROOT_PATH'] || File.join(':rails_root', 'public', 'system')
    root_path       = configured_root.gsub(':rails_root', Rails.root.to_s)

    # Root with exactly one trailing separator. A configured root that already
    # ends in a separator would otherwise never match the paths yielded below,
    # every ID would parse as 0 and every file would be treated as an orphan.
    key_prefix = File.join(root_path, '')

    Find.find(File.join(root_path, 'media_attachments', 'files')) do |path|
      next if File.directory?(path)

      # Strip the storage root from the front of the path only.
      key           = path.start_with?(key_prefix) ? path[key_prefix.length..-1] : path
      segments      = key.split(File::SEPARATOR)
      attachment_id = attachment_id_for.call(segments)
      filename      = segments.last
      attachment    = MediaAttachment.find_by(id: attachment_id)

      progress.increment

      next unless orphan.call(attachment, filename)

      reclaimed_bytes += File.size(path)
      removed += 1
      File.delete(path) unless options[:dry_run]
      progress.log("Found and removed orphan: #{key}#{dry_run}")
    end
  end

  # The bar was created with a nil total; set the total to the count reached
  # before finishing it.
  progress.total = progress.progress
  progress.finish

  say("Removed #{removed} orphans (approx. #{number_to_human_size(reclaimed_bytes)})#{dry_run}", :green, true)
end
|
|
|
|
|
|
|
|
|
option :account, type: :string |
|
|
|
|
option :domain, type: :string |
|
|
|
|
option :status, type: :numeric |
|
|
|
|