You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

62 lines
4.5 KiB

  1. # frozen_string_literal: true
  2. require_relative '../../config/boot'
  3. require_relative '../../config/environment'
  4. require_relative 'cli_helper'
  5. module Mastodon
  6. class StatusesCLI < Thor
  7. include ActionView::Helpers::NumberHelper
  8. def self.exit_on_failure?
  9. true
  10. end
  11. option :days, type: :numeric, default: 90
  12. desc 'remove', 'Remove unreferenced statuses'
  13. long_desc <<~LONG_DESC
  14. Remove statuses that are not referenced by local user activity, such as
  15. ones that came from relays, or belonging to users that were once followed
  16. by someone locally but no longer are.
  17. This is a computationally heavy procedure that creates extra database
  18. indicides before commencing, and removes them afterward.
  19. LONG_DESC
  20. def remove
  21. say('Creating temporary database indices...')
  22. ActiveRecord::Base.connection.add_index(:accounts, :id, name: :index_accounts_local, where: 'domain is null', algorithm: :concurrently) unless ActiveRecord::Base.connection.index_name_exists?(:accounts, :index_accounts_local)
  23. ActiveRecord::Base.connection.add_index(:status_pins, :status_id, name: :index_status_pins_status_id, algorithm: :concurrently) unless ActiveRecord::Base.connection.index_name_exists?(:status_pins, :index_status_pins_status_id)
  24. ActiveRecord::Base.connection.add_index(:media_attachments, :remote_url, name: :index_media_attachments_remote_url, where: 'remote_url is not null', algorithm: :concurrently) unless ActiveRecord::Base.connection.index_name_exists?(:media_attachments, :index_media_attachments_remote_url)
  25. max_id = Mastodon::Snowflake.id_at(options[:days].days.ago)
  26. start_at = Time.now.to_f
  27. say('Beginning removal... This might take a while...')
  28. Status.remote
  29. .where('id < ?', max_id)
  30. .where(reblog_of_id: nil) # Skip reblogs
  31. .where(in_reply_to_id: nil) # Skip replies
  32. .where('id NOT IN (SELECT status_pins.status_id FROM status_pins WHERE statuses.id = status_id)') # Skip statuses that are pinned on profiles
  33. .where('id NOT IN (SELECT mentions.status_id FROM mentions WHERE statuses.id = mentions.status_id AND mentions.account_id IN (SELECT accounts.id FROM accounts WHERE domain IS NULL))') # Skip statuses that mention local accounts
  34. .where('id NOT IN (SELECT statuses1.in_reply_to_id FROM statuses AS statuses1 WHERE statuses.id = statuses1.in_reply_to_id)') # Skip statuses favourited by local accounts
  35. .where('id NOT IN (SELECT statuses1.reblog_of_id FROM statuses AS statuses1 WHERE statuses.id = statuses1.reblog_of_id AND statuses1.account_id IN (SELECT accounts.id FROM accounts WHERE accounts.domain IS NULL))') # Skip statuses reblogged by local accounts
  36. .where('account_id NOT IN (SELECT follows.target_account_id FROM follows WHERE statuses.account_id = follows.target_account_id)') # Skip accounts followed by local accounts
  37. .in_batches
  38. .delete_all
  39. say('Beginning removal of now-orphaned media attachments to free up disk space...')
  40. Scheduler::MediaCleanupScheduler.new.perform
  41. say("Done after #{Time.now.to_f - start_at}s", :green)
  42. ensure
  43. say('Removing temporary database indices to restore write performance...')
  44. ActiveRecord::Base.connection.remove_index(:accounts, name: :index_accounts_local) if ActiveRecord::Base.connection.index_name_exists?(:accounts, :index_accounts_local)
  45. ActiveRecord::Base.connection.remove_index(:status_pins, name: :index_status_pins_status_id) if ActiveRecord::Base.connection.index_name_exists?(:status_pins, :index_status_pins_status_id)
  46. ActiveRecord::Base.connection.remove_index(:media_attachments, name: :index_media_attachments_remote_url) if ActiveRecord::Base.connection.index_name_exists?(:media_attachments, :index_media_attachments_remote_url)
  47. end
  48. end
  49. end