Add retry for failed media downloads and tootctl media refresh (#11775)
				
					
				
			This commit is contained in:
		
							parent
							
								
									8674814825
								
							
						
					
					
						commit
						031ca25014
					
				@ -189,22 +189,25 @@ class ActivityPub::Activity::Create < ActivityPub::Activity
 | 
				
			|||||||
    media_attachments = []
 | 
					    media_attachments = []
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    as_array(@object['attachment']).each do |attachment|
 | 
					    as_array(@object['attachment']).each do |attachment|
 | 
				
			||||||
      next if attachment['url'].blank?
 | 
					      next if attachment['url'].blank? || media_attachments.size >= 4
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      href             = Addressable::URI.parse(attachment['url']).normalize.to_s
 | 
					      begin
 | 
				
			||||||
      media_attachment = MediaAttachment.create(account: @account, remote_url: href, description: attachment['name'].presence, focus: attachment['focalPoint'], blurhash: supported_blurhash?(attachment['blurhash']) ? attachment['blurhash'] : nil)
 | 
					        href             = Addressable::URI.parse(attachment['url']).normalize.to_s
 | 
				
			||||||
      media_attachments << media_attachment
 | 
					        media_attachment = MediaAttachment.create(account: @account, remote_url: href, description: attachment['name'].presence, focus: attachment['focalPoint'], blurhash: supported_blurhash?(attachment['blurhash']) ? attachment['blurhash'] : nil)
 | 
				
			||||||
 | 
					        media_attachments << media_attachment
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      next if unsupported_media_type?(attachment['mediaType']) || skip_download?
 | 
					        next if unsupported_media_type?(attachment['mediaType']) || skip_download?
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      media_attachment.file_remote_url = href
 | 
					        media_attachment.file_remote_url = href
 | 
				
			||||||
      media_attachment.save
 | 
					        media_attachment.save
 | 
				
			||||||
 | 
					      rescue Mastodon::UnexpectedResponseError, HTTP::TimeoutError, HTTP::ConnectionError, OpenSSL::SSL::SSLError
 | 
				
			||||||
 | 
					        RedownloadMediaWorker.perform_in(rand(30..600).seconds, media_attachment.id)
 | 
				
			||||||
 | 
					      end
 | 
				
			||||||
    end
 | 
					    end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    media_attachments
 | 
					    media_attachments
 | 
				
			||||||
  rescue Addressable::URI::InvalidURIError => e
 | 
					  rescue Addressable::URI::InvalidURIError => e
 | 
				
			||||||
    Rails.logger.debug e
 | 
					    Rails.logger.debug "Invalid URL in attachment: #{e}"
 | 
				
			||||||
 | 
					 | 
				
			||||||
    media_attachments
 | 
					    media_attachments
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
				
			|||||||
@ -4,7 +4,7 @@ module Remotable
 | 
				
			|||||||
  extend ActiveSupport::Concern
 | 
					  extend ActiveSupport::Concern
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  class_methods do
 | 
					  class_methods do
 | 
				
			||||||
    def remotable_attachment(attachment_name, limit)
 | 
					    def remotable_attachment(attachment_name, limit, suppress_errors: true)
 | 
				
			||||||
      attribute_name  = "#{attachment_name}_remote_url".to_sym
 | 
					      attribute_name  = "#{attachment_name}_remote_url".to_sym
 | 
				
			||||||
      method_name     = "#{attribute_name}=".to_sym
 | 
					      method_name     = "#{attribute_name}=".to_sym
 | 
				
			||||||
      alt_method_name = "reset_#{attachment_name}!".to_sym
 | 
					      alt_method_name = "reset_#{attachment_name}!".to_sym
 | 
				
			||||||
@ -22,7 +22,7 @@ module Remotable
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
        begin
 | 
					        begin
 | 
				
			||||||
          Request.new(:get, url).perform do |response|
 | 
					          Request.new(:get, url).perform do |response|
 | 
				
			||||||
            next if response.code != 200
 | 
					            raise Mastodon::UnexpectedResponseError, response unless (200...300).cover?(response.code)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
            content_type = parse_content_type(response.headers.get('content-type').last)
 | 
					            content_type = parse_content_type(response.headers.get('content-type').last)
 | 
				
			||||||
            extname      = detect_extname_from_content_type(content_type)
 | 
					            extname      = detect_extname_from_content_type(content_type)
 | 
				
			||||||
@ -41,11 +41,11 @@ module Remotable
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
            self[attribute_name] = url if has_attribute?(attribute_name)
 | 
					            self[attribute_name] = url if has_attribute?(attribute_name)
 | 
				
			||||||
          end
 | 
					          end
 | 
				
			||||||
        rescue HTTP::TimeoutError, HTTP::ConnectionError, OpenSSL::SSL::SSLError, Paperclip::Errors::NotIdentifiedByImageMagickError, Addressable::URI::InvalidURIError, Mastodon::HostValidationError, Mastodon::LengthValidationError => e
 | 
					        rescue Mastodon::UnexpectedResponseError, HTTP::TimeoutError, HTTP::ConnectionError, OpenSSL::SSL::SSLError => e
 | 
				
			||||||
 | 
					          Rails.logger.debug "Error fetching remote #{attachment_name}: #{e}"
 | 
				
			||||||
 | 
					          raise e unless suppress_errors
 | 
				
			||||||
 | 
					        rescue Paperclip::Errors::NotIdentifiedByImageMagickError, Addressable::URI::InvalidURIError, Mastodon::HostValidationError, Mastodon::LengthValidationError, Paperclip::Error, Mastodon::DimensionsValidationError => e
 | 
				
			||||||
          Rails.logger.debug "Error fetching remote #{attachment_name}: #{e}"
 | 
					          Rails.logger.debug "Error fetching remote #{attachment_name}: #{e}"
 | 
				
			||||||
          nil
 | 
					 | 
				
			||||||
        rescue Paperclip::Error, Mastodon::DimensionsValidationError => e
 | 
					 | 
				
			||||||
          Rails.logger.debug "Error processing remote #{attachment_name}: #{e}"
 | 
					 | 
				
			||||||
          nil
 | 
					          nil
 | 
				
			||||||
        end
 | 
					        end
 | 
				
			||||||
      end
 | 
					      end
 | 
				
			||||||
 | 
				
			|||||||
@ -118,7 +118,7 @@ class MediaAttachment < ApplicationRecord
 | 
				
			|||||||
  validates_attachment_content_type :file, content_type: IMAGE_MIME_TYPES + VIDEO_MIME_TYPES + AUDIO_MIME_TYPES
 | 
					  validates_attachment_content_type :file, content_type: IMAGE_MIME_TYPES + VIDEO_MIME_TYPES + AUDIO_MIME_TYPES
 | 
				
			||||||
  validates_attachment_size :file, less_than: IMAGE_LIMIT, unless: :larger_media_format?
 | 
					  validates_attachment_size :file, less_than: IMAGE_LIMIT, unless: :larger_media_format?
 | 
				
			||||||
  validates_attachment_size :file, less_than: VIDEO_LIMIT, if: :larger_media_format?
 | 
					  validates_attachment_size :file, less_than: VIDEO_LIMIT, if: :larger_media_format?
 | 
				
			||||||
  remotable_attachment :file, VIDEO_LIMIT
 | 
					  remotable_attachment :file, VIDEO_LIMIT, suppress_errors: false
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  include Attachmentable
 | 
					  include Attachmentable
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
				
			|||||||
							
								
								
									
										19
									
								
								app/workers/redownload_media_worker.rb
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										19
									
								
								app/workers/redownload_media_worker.rb
									
									
									
									
									
										Normal file
									
								
							@ -0,0 +1,19 @@
 | 
				
			|||||||
 | 
					# frozen_string_literal: true
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					class RedownloadMediaWorker
 | 
				
			||||||
 | 
					  include Sidekiq::Worker
 | 
				
			||||||
 | 
					  include ExponentialBackoff
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  sidekiq_options queue: 'pull', retry: 3
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  def perform(id)
 | 
				
			||||||
 | 
					    media_attachment = MediaAttachment.find(id)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    return if media_attachment.remote_url.blank?
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    media_attachment.reset_file!
 | 
				
			||||||
 | 
					    media_attachment.save
 | 
				
			||||||
 | 
					  rescue ActiveRecord::RecordNotFound
 | 
				
			||||||
 | 
					    true
 | 
				
			||||||
 | 
					  end
 | 
				
			||||||
 | 
					end
 | 
				
			||||||
@ -43,5 +43,59 @@ module Mastodon
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
      say("Removed #{processed} media attachments (approx. #{number_to_human_size(aggregate)}) #{dry_run}", :green, true)
 | 
					      say("Removed #{processed} media attachments (approx. #{number_to_human_size(aggregate)}) #{dry_run}", :green, true)
 | 
				
			||||||
    end
 | 
					    end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    option :account, type: :string
 | 
				
			||||||
 | 
					    option :domain, type: :string
 | 
				
			||||||
 | 
					    option :status, type: :numeric
 | 
				
			||||||
 | 
					    option :concurrency, type: :numeric, default: 5, aliases: [:c]
 | 
				
			||||||
 | 
					    option :verbose, type: :boolean, default: false, aliases: [:v]
 | 
				
			||||||
 | 
					    option :dry_run, type: :boolean, default: false
 | 
				
			||||||
 | 
					    desc 'refresh', 'Fetch remote media files'
 | 
				
			||||||
 | 
					    long_desc <<-DESC
 | 
				
			||||||
 | 
					      Re-downloads media attachments from other servers. You must specify the
 | 
				
			||||||
 | 
					      source of media attachments with one of the following options:
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      Use the --status option to download attachments from a specific status,
 | 
				
			||||||
 | 
					      using the status local numeric ID.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      Use the --account option to download attachments from a specific account,
 | 
				
			||||||
 | 
					      using username@domain handle of the account.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      Use the --domain option to download attachments from a specific domain.
 | 
				
			||||||
 | 
					    DESC
 | 
				
			||||||
 | 
					    def refresh
 | 
				
			||||||
 | 
					      dry_run = options[:dry_run] ? ' (DRY RUN)' : ''
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      if options[:status]
 | 
				
			||||||
 | 
					        scope = MediaAttachment.where(status_id: options[:status])
 | 
				
			||||||
 | 
					      elsif options[:account]
 | 
				
			||||||
 | 
					        username, domain = username.split('@')
 | 
				
			||||||
 | 
					        account = Account.find_remote(username, domain)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					        if account.nil?
 | 
				
			||||||
 | 
					          say('No such account', :red)
 | 
				
			||||||
 | 
					          exit(1)
 | 
				
			||||||
 | 
					        end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					        scope = MediaAttachment.where(account_id: account.id)
 | 
				
			||||||
 | 
					      elsif options[:domain]
 | 
				
			||||||
 | 
					        scope = MediaAttachment.joins(:account).merge(Account.by_domain_and_subdomains(options[:domain]))
 | 
				
			||||||
 | 
					      else
 | 
				
			||||||
 | 
					        exit(1)
 | 
				
			||||||
 | 
					      end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      processed, aggregate = parallelize_with_progress(scope) do |media_attachment|
 | 
				
			||||||
 | 
					        next if media_attachment.remote_url.blank?
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					        unless options[:dry_run]
 | 
				
			||||||
 | 
					          media_attachment.reset_file!
 | 
				
			||||||
 | 
					          media_attachment.save
 | 
				
			||||||
 | 
					        end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					        media_attachment.file_file_size
 | 
				
			||||||
 | 
					      end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      say("Downloaded #{processed} media attachments (approx. #{number_to_human_size(aggregate)})#{dry_run}", :green, true)
 | 
				
			||||||
 | 
					    end
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
end
 | 
					end
 | 
				
			||||||
 | 
				
			|||||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user