about summary refs log tree commit diff
path: root/app/workers/scheduler
diff options
context:
space:
mode:
author multiple creatures <dev@multiple-creature.party> 2019-08-03 05:32:49 -0500
committer multiple creatures <dev@multiple-creature.party> 2019-08-03 05:32:49 -0500
commit 6613005ae63bdc31a818d7488c36a130b558a903 (patch)
tree c5ac9032e4b87413f902b0e0be087fb0c476a1e1 /app/workers/scheduler
parent 99d1b1ff6f482df13d6917d5340ec28baaf76302 (diff)
`monsterpit-janitor` is now built in as a sidekiq job (with better code)
Diffstat (limited to 'app/workers/scheduler')
-rw-r--r-- app/workers/scheduler/janitor_scheduler.rb 148
1 files changed, 148 insertions, 0 deletions
diff --git a/app/workers/scheduler/janitor_scheduler.rb b/app/workers/scheduler/janitor_scheduler.rb
new file mode 100644
index 000000000..70d1c4ea0
--- /dev/null
+++ b/app/workers/scheduler/janitor_scheduler.rb
@@ -0,0 +1,148 @@
+# frozen_string_literal: true
+
+class Scheduler::JanitorScheduler
+  include Sidekiq::Worker
+  include BlocklistHelper
+  include BangtagHelper
+
+  MIN_POSTS = 6
+
+  sidekiq_options unique: :until_executed, retry: 0
+
+  def perform
+    @account = admin_account
+    return if @account.nil?
+
+    @exclude_ids = excluded_account_ids
+    @exclude_domains = excluded_domains
+    @exclude_markov = excluded_accounts_from_env('MARKOV')
+
+    prune_deleted_accounts!
+    suspend_abandoned_accounts!
+    suspend_spammers!
+    silence_markov!
+    import_blocklists!
+  end
+
+  private
+
+  def prune_deleted_accounts!
+    Account.local.where.not(suspended_at: nil).destroy_all
+  end
+
+  def suspend_abandoned_accounts!
+    reason = "Appears to be abandoned. Freeing up the username for someone else."
+    abandoned_accounts.find_each do |account|
+      account_policy(account.username, nil, :suspend, reason)
+    end
+  end
+
+  def suspend_spammers!
+    reason = 'Appears to be a spammer account.'
+    spammer_accounts.find_each do |spammer|
+      account_policy(spammer.username, spammer.domain, :suspend, reason)
+    end
+  end
+
+  def silence_markov!
+    reason = 'Appears to be a markov bot.'
+    markov_accounts.find_each do |markov|
+      account_policy(markov.username, markov.domain, :silence, reason)
+    end
+  end
+
+  def import_blocklists!
+    blocks = merged_blocklist.reject { |entry| entry[:domain].in?(@exclude_domains) }
+    blocks.each do |entry|
+      block = DomainBlock.create!(entry)
+      DomainBlockWorker.perform_async(block)
+      Admin::ActionLog.create(account: @account, action: :create, target: block)
+      user_friendly_action_log(@account, :create, block)
+    end
+  end
+
+
+
+  def admin_account
+    account_id = ENV.fetch('JANITOR_USER', '').to_i
+    return if account_id == 0
+    Account.find_by(id: account_id)
+  end
+
+  def spammer_accounts
+    spammer_ids = spammer_account_ids
+    Account.reorder(nil).where(id: spammer_ids, suspended_at: nil)
+      .where.not(id: @exclude_ids)
+  end
+
+  def markov_accounts
+    Account.reorder(nil).where(silenced_at: nil).where.not(id: @exclude_markov)
+      .where('username LIKE ? OR note ILIKE ?', '%ebooks%', '%markov%')
+  end
+
+  def abandoned_accounts
+    Account.reorder(nil).where(id: abandoned_account_ids)
+  end
+
+  def abandoned_users
+    User.select(:account_id).where('last_sign_in_at < ?', 3.months.ago)
+  end
+
+  def excluded_domains
+    existing_policy_domains | domains_from_account_ids | excluded_from_env('DOMAINS')
+  end
+
+
+  def abandoned_account_ids
+    AccountStat.select(:account_id)
+      .where(account_id: abandoned_users)
+      .where('statuses_count < ?', MIN_POSTS)
+  end
+
+  def excluded_account_ids
+    local_account_ids | outgoing_follow_ids | excluded_accounts_from_env('USERNAMES')
+  end
+
+  def spammer_account_ids
+    post_spammer_ids | card_spammer_ids
+  end
+
+  def existing_policy_domains
+    DomainBlock.all.pluck(:domain)
+  end
+
+  def domains_from_account_ids
+    Account.reorder(nil).where(id: @account_ids).pluck(:domain).uniq
+  end
+
+  def local_account_ids
+    Account.local.reorder(nil).pluck(:id)
+  end
+
+  def outgoing_follow_ids
+    Account.local.reorder(nil).flat_map { |account| account.following_ids }
+  end
+
+  def post_spammer_ids
+    Status.with_public_visibility
+      .reorder(nil)
+      .where('tsv @@ to_tsquery(?)', 'womenarestupid.site & /blog/:*')
+      .pluck(:account_id)
+  end
+
+  def card_spammer_ids
+    PreviewCard.where('url LIKE ? OR title ILIKE ?', '%womenarestupid%', '%womenaredumb%')
+      .reorder(nil)
+      .flat_map { |card| card.statuses.pluck(:account_id) }
+  end
+
+
+  def excluded_accounts_from_env(suffix)
+    excluded_usernames = ENV.fetch("JANITOR_EXCLUDE_#{suffix.upcase}", '').split
+    Account.reorder(nil).where(username: excluded_usernames).pluck(:id)
+  end
+
+  def excluded_from_env(suffix)
+    ENV.fetch("JANITOR_EXCLUDE_#{suffix.upcase}", '').split
+  end
+end