Commit 47e38bbf authored by Adam Hegyi's avatar Adam Hegyi

Multi DB support for loose foreign keys

This change adds multi-db support for loose foreign key deleted records
table.
parent 8487fa04
# frozen_string_literal: true # frozen_string_literal: true
class LooseForeignKeys::DeletedRecord < ApplicationRecord class LooseForeignKeys::DeletedRecord < Gitlab::Database::SharedModel
PARTITION_DURATION = 1.day PARTITION_DURATION = 1.day
include PartitionedTable include PartitionedTable
......
...@@ -4,7 +4,7 @@ module LooseForeignKeys ...@@ -4,7 +4,7 @@ module LooseForeignKeys
class ModificationTracker class ModificationTracker
MAX_DELETES = 100_000 MAX_DELETES = 100_000
MAX_UPDATES = 50_000 MAX_UPDATES = 50_000
MAX_RUNTIME = 3.minutes MAX_RUNTIME = 30.seconds # must be less than the scheduling frequency of the LooseForeignKeys::CleanupWorker cron worker
delegate :monotonic_time, to: :'Gitlab::Metrics::System' delegate :monotonic_time, to: :'Gitlab::Metrics::System'
......
...@@ -10,7 +10,6 @@ module LooseForeignKeys ...@@ -10,7 +10,6 @@ module LooseForeignKeys
def execute def execute
modification_tracker = ModificationTracker.new modification_tracker = ModificationTracker.new
tracked_tables.cycle do |table| tracked_tables.cycle do |table|
records = load_batch_for_table(table) records = load_batch_for_table(table)
......
...@@ -6,6 +6,7 @@ module LooseForeignKeys ...@@ -6,6 +6,7 @@ module LooseForeignKeys
include Gitlab::ExclusiveLeaseHelpers include Gitlab::ExclusiveLeaseHelpers
include CronjobQueue # rubocop: disable Scalability/CronWorkerContext include CronjobQueue # rubocop: disable Scalability/CronWorkerContext
sidekiq_options retry: false
feature_category :sharding feature_category :sharding
data_consistency :always data_consistency :always
idempotent! idempotent!
...@@ -13,13 +14,30 @@ module LooseForeignKeys ...@@ -13,13 +14,30 @@ module LooseForeignKeys
def perform def perform
return if Feature.disabled?(:loose_foreign_key_cleanup, default_enabled: :yaml) return if Feature.disabled?(:loose_foreign_key_cleanup, default_enabled: :yaml)
ttl = ModificationTracker::MAX_RUNTIME + 1.minute in_lock(self.class.name.underscore, ttl: ModificationTracker::MAX_RUNTIME, retries: 0) do
in_lock(self.class.name.underscore, ttl: ttl, retries: 0) do stats = {}
# TODO: Iterate over the connections
# https://gitlab.com/gitlab-org/gitlab/-/issues/341513 connection_name, base_model = current_connection_name_and_base_model
stats = ProcessDeletedRecordsService.new(connection: ApplicationRecord.connection).execute
Gitlab::Database::SharedModel.using_connection(base_model.connection) do
stats = ProcessDeletedRecordsService.new(connection: base_model.connection).execute
stats[:connection] = connection_name
end
log_extra_metadata_on_done(:stats, stats) log_extra_metadata_on_done(:stats, stats)
end end
end end
private
# Rotate the databases every minute
#
# If one DB is configured: every minute use the configured DB
# If two DBs are configured (Main, CI): minute 1 -> Main, minute 2 -> CI
def current_connection_name_and_base_model
minutes_since_epoch = Time.current.to_i / 60
connections_with_name = Gitlab::Database.database_base_models.to_a # this will never be empty
connections_with_name[minutes_since_epoch % connections_with_name.count]
end
end end
end end
...@@ -735,7 +735,7 @@ Gitlab.ee do ...@@ -735,7 +735,7 @@ Gitlab.ee do
Settings.cron_jobs['app_sec_dast_profile_schedule_worker']['cron'] ||= '7-59/15 * * * *' Settings.cron_jobs['app_sec_dast_profile_schedule_worker']['cron'] ||= '7-59/15 * * * *'
Settings.cron_jobs['app_sec_dast_profile_schedule_worker']['job_class'] = 'AppSec::Dast::ProfileScheduleWorker' Settings.cron_jobs['app_sec_dast_profile_schedule_worker']['job_class'] = 'AppSec::Dast::ProfileScheduleWorker'
Settings.cron_jobs['loose_foreign_keys_cleanup_worker'] ||= Settingslogic.new({}) Settings.cron_jobs['loose_foreign_keys_cleanup_worker'] ||= Settingslogic.new({})
Settings.cron_jobs['loose_foreign_keys_cleanup_worker']['cron'] ||= '*/5 * * * *' Settings.cron_jobs['loose_foreign_keys_cleanup_worker']['cron'] ||= '*/1 * * * *'
Settings.cron_jobs['loose_foreign_keys_cleanup_worker']['job_class'] = 'LooseForeignKeys::CleanupWorker' Settings.cron_jobs['loose_foreign_keys_cleanup_worker']['job_class'] = 'LooseForeignKeys::CleanupWorker'
end end
......
...@@ -43,7 +43,7 @@ we can: ...@@ -43,7 +43,7 @@ we can:
1. Create a `DELETE` trigger on the `projects` table. 1. Create a `DELETE` trigger on the `projects` table.
Record the deletions in a separate table (`deleted_records`). Record the deletions in a separate table (`deleted_records`).
1. A job checks the `deleted_records` table every 5 minutes. 1. A job checks the `deleted_records` table every minute or two.
1. For each record in the table, delete the associated `ci_pipelines` records 1. For each record in the table, delete the associated `ci_pipelines` records
using the `project_id` column. using the `project_id` column.
......
...@@ -4,6 +4,7 @@ require 'spec_helper' ...@@ -4,6 +4,7 @@ require 'spec_helper'
RSpec.describe LooseForeignKeys::CleanupWorker do RSpec.describe LooseForeignKeys::CleanupWorker do
include MigrationsHelpers include MigrationsHelpers
using RSpec::Parameterized::TableSyntax
def create_table_structure def create_table_structure
migration = ActiveRecord::Migration.new.extend(Gitlab::Database::MigrationHelpers::LooseForeignKeyHelpers) migration = ActiveRecord::Migration.new.extend(Gitlab::Database::MigrationHelpers::LooseForeignKeyHelpers)
...@@ -149,4 +150,31 @@ RSpec.describe LooseForeignKeys::CleanupWorker do ...@@ -149,4 +150,31 @@ RSpec.describe LooseForeignKeys::CleanupWorker do
expect { described_class.new.perform }.not_to change { LooseForeignKeys::DeletedRecord.status_processed.count } expect { described_class.new.perform }.not_to change { LooseForeignKeys::DeletedRecord.status_processed.count }
end end
end end
describe 'multi-database support' do
where(:current_minute, :configured_base_models, :expected_connection) do
2 | { main: ApplicationRecord, ci: Ci::ApplicationRecord } | ApplicationRecord.connection
3 | { main: ApplicationRecord, ci: Ci::ApplicationRecord } | Ci::ApplicationRecord.connection
2 | { main: ApplicationRecord } | ApplicationRecord.connection
3 | { main: ApplicationRecord } | ApplicationRecord.connection
end
with_them do
before do
allow(Gitlab::Database).to receive(:database_base_models).and_return(configured_base_models)
end
it 'uses the correct connection' do
LooseForeignKeys::DeletedRecord.count.times do
expect_next_found_instance_of(LooseForeignKeys::DeletedRecord) do |instance|
expect(instance.class.connection).to eq(expected_connection)
end
end
travel_to DateTime.new(2019, 1, 1, 10, current_minute) do
described_class.new.perform
end
end
end
end
end end
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment