Commit b8ce03a6 authored by Mayra Cabrera's avatar Mayra Cabrera

Merge branch '218424-migration-helper-to-sync-partitioned-tables' into 'master'

Migration helper to sync trigger partitioned tables

See merge request gitlab-org/gitlab!32884
parents 8e98c110 b3879f74
...@@ -79,11 +79,7 @@ module Gitlab ...@@ -79,11 +79,7 @@ module Gitlab
end end
def update_foreign_keys(from_table, to_table, from_column, to_column, cascade_delete = nil) def update_foreign_keys(from_table, to_table, from_column, to_column, cascade_delete = nil)
if transaction_open? assert_not_in_transaction_block(scope: 'partitioned foreign key')
raise 'partitioned foreign key operations can not be run inside a transaction block, ' \
'you can disable transaction blocks by calling disable_ddl_transaction! ' \
'in the body of your migration class'
end
from_column ||= "#{to_table.to_s.singularize}_id" from_column ||= "#{to_table.to_s.singularize}_id"
specified_key = fk_from_spec(from_table, to_table, from_column, to_column, cascade_delete) specified_key = fk_from_spec(from_table, to_table, from_column, to_column, cascade_delete)
...@@ -103,7 +99,7 @@ module Gitlab ...@@ -103,7 +99,7 @@ module Gitlab
drop_function(fn_name, if_exists: true) drop_function(fn_name, if_exists: true)
else else
create_or_replace_fk_function(fn_name, final_keys) create_or_replace_fk_function(fn_name, final_keys)
create_function_trigger(trigger_name, fn_name, fires: "AFTER DELETE ON #{to_table}") create_trigger(trigger_name, fn_name, fires: "AFTER DELETE ON #{to_table}")
end end
end end
end end
...@@ -116,13 +112,6 @@ module Gitlab ...@@ -116,13 +112,6 @@ module Gitlab
end end
end end
def with_lock_retries(&block)
Gitlab::Database::WithLockRetries.new({
klass: self.class,
logger: Gitlab::BackgroundMigration::Logger
}).run(&block)
end
def find_existing_key(keys, key) def find_existing_key(keys, key)
keys.find { |k| k.from_table == key.from_table && k.from_column == key.from_column } keys.find { |k| k.from_table == key.from_table && k.from_column == key.from_column }
end end
......
...@@ -4,7 +4,10 @@ module Gitlab ...@@ -4,7 +4,10 @@ module Gitlab
module Database module Database
module PartitioningMigrationHelpers module PartitioningMigrationHelpers
module TableManagementHelpers module TableManagementHelpers
include SchemaHelpers include ::Gitlab::Database::SchemaHelpers
WHITELISTED_TABLES = %w[audit_events].freeze
ERROR_SCOPE = 'table partitioning'
# Creates a partitioned copy of an existing table, using a RANGE partitioning strategy on a timestamp column. # Creates a partitioned copy of an existing table, using a RANGE partitioning strategy on a timestamp column.
# One partition is created per month between the given `min_date` and `max_date`. # One partition is created per month between the given `min_date` and `max_date`.
...@@ -20,6 +23,9 @@ module Gitlab ...@@ -20,6 +23,9 @@ module Gitlab
# :max_date - a date specifying the upper bounds of the partitioning range # :max_date - a date specifying the upper bounds of the partitioning range
# #
def partition_table_by_date(table_name, column_name, min_date:, max_date:) def partition_table_by_date(table_name, column_name, min_date:, max_date:)
assert_table_is_whitelisted(table_name)
assert_not_in_transaction_block(scope: ERROR_SCOPE)
raise "max_date #{max_date} must be greater than min_date #{min_date}" if min_date >= max_date raise "max_date #{max_date} must be greater than min_date #{min_date}" if min_date >= max_date
primary_key = connection.primary_key(table_name) primary_key = connection.primary_key(table_name)
...@@ -31,6 +37,7 @@ module Gitlab ...@@ -31,6 +37,7 @@ module Gitlab
new_table_name = partitioned_table_name(table_name) new_table_name = partitioned_table_name(table_name)
create_range_partitioned_copy(new_table_name, table_name, partition_column, primary_key) create_range_partitioned_copy(new_table_name, table_name, partition_column, primary_key)
create_daterange_partitions(new_table_name, partition_column.name, min_date, max_date) create_daterange_partitions(new_table_name, partition_column.name, min_date, max_date)
create_sync_trigger(table_name, new_table_name, primary_key)
end end
# Clean up a partitioned copy of an existing table. This deletes the partitioned table and all partitions. # Clean up a partitioned copy of an existing table. This deletes the partitioned table and all partitions.
...@@ -40,22 +47,57 @@ module Gitlab ...@@ -40,22 +47,57 @@ module Gitlab
# drop_partitioned_table_for :audit_events # drop_partitioned_table_for :audit_events
# #
def drop_partitioned_table_for(table_name) def drop_partitioned_table_for(table_name)
drop_table(partitioned_table_name(table_name)) assert_table_is_whitelisted(table_name)
assert_not_in_transaction_block(scope: ERROR_SCOPE)
with_lock_retries do
trigger_name = sync_trigger_name(table_name)
drop_trigger(table_name, trigger_name)
end
function_name = sync_function_name(table_name)
drop_function(function_name)
part_table_name = partitioned_table_name(table_name)
drop_table(part_table_name)
end end
private private
def assert_table_is_whitelisted(table_name)
return if WHITELISTED_TABLES.include?(table_name.to_s)
raise "partitioning helpers are in active development, and #{table_name} is not whitelisted for use, " \
"for more information please contact the database team"
end
def partitioned_table_name(table) def partitioned_table_name(table)
tmp_table_name("#{table}_part") tmp_table_name("#{table}_part")
end end
def sync_function_name(table)
object_name(table, 'table_sync_function')
end
def sync_trigger_name(table)
object_name(table, 'table_sync_trigger')
end
def find_column_definition(table, column) def find_column_definition(table, column)
connection.columns(table).find { |c| c.name == column.to_s } connection.columns(table).find { |c| c.name == column.to_s }
end end
def create_range_partitioned_copy(table_name, template_table_name, partition_column, primary_key) def create_range_partitioned_copy(table_name, template_table_name, partition_column, primary_key)
tmp_column_name = object_name(partition_column.name, 'partition_key') if table_exists?(table_name)
# rubocop:disable Gitlab/RailsLogger
Rails.logger.warn "Partitioned table not created because it already exists" \
" (this may be due to an aborted migration or similar): table_name: #{table_name} "
# rubocop:enable Gitlab/RailsLogger
return
end
tmp_column_name = object_name(partition_column.name, 'partition_key')
transaction do
execute(<<~SQL) execute(<<~SQL)
CREATE TABLE #{table_name} ( CREATE TABLE #{table_name} (
LIKE #{template_table_name} INCLUDING ALL EXCLUDING INDEXES, LIKE #{template_table_name} INCLUDING ALL EXCLUDING INDEXES,
...@@ -68,12 +110,13 @@ module Gitlab ...@@ -68,12 +110,13 @@ module Gitlab
rename_column(table_name, tmp_column_name, partition_column.name) rename_column(table_name, tmp_column_name, partition_column.name)
change_column_default(table_name, primary_key, nil) change_column_default(table_name, primary_key, nil)
end end
end
def create_daterange_partitions(table_name, column_name, min_date, max_date) def create_daterange_partitions(table_name, column_name, min_date, max_date)
min_date = min_date.beginning_of_month.to_date min_date = min_date.beginning_of_month.to_date
max_date = max_date.next_month.beginning_of_month.to_date max_date = max_date.next_month.beginning_of_month.to_date
create_range_partition("#{table_name}_000000", table_name, 'MINVALUE', to_sql_date_literal(min_date)) create_range_partition_safely("#{table_name}_000000", table_name, 'MINVALUE', to_sql_date_literal(min_date))
while min_date < max_date while min_date < max_date
partition_name = "#{table_name}_#{min_date.strftime('%Y%m')}" partition_name = "#{table_name}_#{min_date.strftime('%Y%m')}"
...@@ -81,7 +124,7 @@ module Gitlab ...@@ -81,7 +124,7 @@ module Gitlab
lower_bound = to_sql_date_literal(min_date) lower_bound = to_sql_date_literal(min_date)
upper_bound = to_sql_date_literal(next_date) upper_bound = to_sql_date_literal(next_date)
create_range_partition(partition_name, table_name, lower_bound, upper_bound) create_range_partition_safely(partition_name, table_name, lower_bound, upper_bound)
min_date = next_date min_date = next_date
end end
end end
...@@ -90,13 +133,57 @@ module Gitlab ...@@ -90,13 +133,57 @@ module Gitlab
connection.quote(date.strftime('%Y-%m-%d')) connection.quote(date.strftime('%Y-%m-%d'))
end end
def create_range_partition(partition_name, table_name, lower_bound, upper_bound) def create_range_partition_safely(partition_name, table_name, lower_bound, upper_bound)
execute(<<~SQL) if table_exists?(partition_name)
CREATE TABLE #{partition_name} PARTITION OF #{table_name} # rubocop:disable Gitlab/RailsLogger
FOR VALUES FROM (#{lower_bound}) TO (#{upper_bound}) Rails.logger.warn "Partition not created because it already exists" \
" (this may be due to an aborted migration or similar): partition_name: #{partition_name}"
# rubocop:enable Gitlab/RailsLogger
return
end
create_range_partition(partition_name, table_name, lower_bound, upper_bound)
end
def create_sync_trigger(source_table, target_table, unique_key)
function_name = sync_function_name(source_table)
trigger_name = sync_trigger_name(source_table)
with_lock_retries do
create_sync_function(function_name, target_table, unique_key)
create_comment('FUNCTION', function_name, "Partitioning migration: table sync for #{source_table} table")
create_trigger(trigger_name, function_name, fires: "AFTER INSERT OR UPDATE OR DELETE ON #{source_table}")
end
end
def create_sync_function(name, target_table, unique_key)
delimiter = ",\n "
column_names = connection.columns(target_table).map(&:name)
set_statements = build_set_statements(column_names, unique_key)
insert_values = column_names.map { |name| "NEW.#{name}" }
create_trigger_function(name, replace: false) do
<<~SQL
IF (TG_OP = 'DELETE') THEN
DELETE FROM #{target_table} where #{unique_key} = OLD.#{unique_key};
ELSIF (TG_OP = 'UPDATE') THEN
UPDATE #{target_table}
SET #{set_statements.join(delimiter)}
WHERE #{target_table}.#{unique_key} = NEW.#{unique_key};
ELSIF (TG_OP = 'INSERT') THEN
INSERT INTO #{target_table} (#{column_names.join(delimiter)})
VALUES (#{insert_values.join(delimiter)});
END IF;
RETURN NULL;
SQL SQL
end end
end end
def build_set_statements(column_names, unique_key)
column_names.reject { |name| name == unique_key }.map { |column_name| "#{column_name} = NEW.#{column_name}" }
end
end
end end
end end
end end
...@@ -16,12 +16,12 @@ module Gitlab ...@@ -16,12 +16,12 @@ module Gitlab
SQL SQL
end end
def create_function_trigger(name, fn_name, fires: nil) def create_trigger(name, function_name, fires: nil)
execute(<<~SQL) execute(<<~SQL)
CREATE TRIGGER #{name} CREATE TRIGGER #{name}
#{fires} #{fires}
FOR EACH ROW FOR EACH ROW
EXECUTE PROCEDURE #{fn_name}() EXECUTE PROCEDURE #{function_name}()
SQL SQL
end end
...@@ -35,6 +35,10 @@ module Gitlab ...@@ -35,6 +35,10 @@ module Gitlab
execute("DROP TRIGGER #{exists_clause} #{name} ON #{table_name}") execute("DROP TRIGGER #{exists_clause} #{name} ON #{table_name}")
end end
def create_comment(type, name, text)
execute("COMMENT ON #{type} #{name} IS '#{text}'")
end
def tmp_table_name(base) def tmp_table_name(base)
hashed_base = Digest::SHA256.hexdigest(base).first(10) hashed_base = Digest::SHA256.hexdigest(base).first(10)
...@@ -48,8 +52,30 @@ module Gitlab ...@@ -48,8 +52,30 @@ module Gitlab
"#{type}_#{hashed_identifier}" "#{type}_#{hashed_identifier}"
end end
def with_lock_retries(&block)
Gitlab::Database::WithLockRetries.new({
klass: self.class,
logger: Gitlab::BackgroundMigration::Logger
}).run(&block)
end
def assert_not_in_transaction_block(scope:)
return unless transaction_open?
raise "#{scope} operations can not be run inside a transaction block, " \
"you can disable transaction blocks by calling disable_ddl_transaction! " \
"in the body of your migration class"
end
private private
def create_range_partition(partition_name, table_name, lower_bound, upper_bound)
execute(<<~SQL)
CREATE TABLE #{partition_name} PARTITION OF #{table_name}
FOR VALUES FROM (#{lower_bound}) TO (#{upper_bound})
SQL
end
def optional_clause(flag, clause) def optional_clause(flag, clause)
flag ? clause : "" flag ? clause : ""
end end
......
...@@ -3,6 +3,8 @@ ...@@ -3,6 +3,8 @@
require 'spec_helper' require 'spec_helper'
describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
include TriggerHelpers
let(:model) do let(:model) do
ActiveRecord::Migration.new.extend(described_class) ActiveRecord::Migration.new.extend(described_class)
end end
...@@ -27,7 +29,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -27,7 +29,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
model.add_partitioned_foreign_key :issue_assignees, referenced_table model.add_partitioned_foreign_key :issue_assignees, referenced_table
expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id') expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -43,7 +45,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -43,7 +45,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
expect_function_to_contain(function_name, expect_function_to_contain(function_name,
'delete from issue_assignees where issue_id = old.id', 'delete from issue_assignees where issue_id = old.id',
'delete from epic_issues where issue_id = old.id') 'delete from epic_issues where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -59,7 +61,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -59,7 +61,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
expect_function_to_contain(function_name, expect_function_to_contain(function_name,
'delete from issues where moved_to_id = old.id', 'delete from issues where moved_to_id = old.id',
'delete from issues where duplicated_to_id = old.id') 'delete from issues where duplicated_to_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -68,7 +70,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -68,7 +70,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
model.add_partitioned_foreign_key :issues, referenced_table, column: :moved_to_id model.add_partitioned_foreign_key :issues, referenced_table, column: :moved_to_id
expect_function_to_contain(function_name, 'delete from issues where moved_to_id = old.id') expect_function_to_contain(function_name, 'delete from issues where moved_to_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
end end
...@@ -79,7 +81,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -79,7 +81,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
model.add_partitioned_foreign_key :issue_assignees, referenced_table, on_delete: :nullify model.add_partitioned_foreign_key :issue_assignees, referenced_table, on_delete: :nullify
expect_function_to_contain(function_name, 'update issue_assignees set issue_id = null where issue_id = old.id') expect_function_to_contain(function_name, 'update issue_assignees set issue_id = null where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -88,7 +90,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -88,7 +90,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
model.add_partitioned_foreign_key :issues, referenced_table, column: :duplicated_to_id model.add_partitioned_foreign_key :issues, referenced_table, column: :duplicated_to_id
expect_function_to_contain(function_name, 'delete from issues where duplicated_to_id = old.id') expect_function_to_contain(function_name, 'delete from issues where duplicated_to_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -99,7 +101,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -99,7 +101,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
model.add_partitioned_foreign_key :user_preferences, referenced_table, column: :user_id, primary_key: :user_id model.add_partitioned_foreign_key :user_preferences, referenced_table, column: :user_id, primary_key: :user_id
expect_function_to_contain(function_name, 'delete from user_preferences where user_id = old.user_id') expect_function_to_contain(function_name, 'delete from user_preferences where user_id = old.user_id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -137,12 +139,12 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -137,12 +139,12 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
expect_function_to_contain(function_name, expect_function_to_contain(function_name,
'delete from issue_assignees where issue_id = old.id', 'delete from issue_assignees where issue_id = old.id',
'delete from epic_issues where issue_id = old.id') 'delete from epic_issues where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
model.remove_partitioned_foreign_key :issue_assignees, referenced_table model.remove_partitioned_foreign_key :issue_assignees, referenced_table
expect_function_to_contain(function_name, 'delete from epic_issues where issue_id = old.id') expect_function_to_contain(function_name, 'delete from epic_issues where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -153,12 +155,12 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -153,12 +155,12 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
it 'removes the trigger function altogether' do it 'removes the trigger function altogether' do
expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id') expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
model.remove_partitioned_foreign_key :issue_assignees, referenced_table model.remove_partitioned_foreign_key :issue_assignees, referenced_table
expect(find_function_def(function_name)).to be_nil expect_function_not_to_exist(function_name)
expect(find_trigger_def(trigger_name)).to be_nil expect_trigger_not_to_exist(referenced_table, trigger_name)
end end
end end
...@@ -169,12 +171,12 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -169,12 +171,12 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
it 'ignores the invalid key and properly recreates the trigger function' do it 'ignores the invalid key and properly recreates the trigger function' do
expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id') expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
model.remove_partitioned_foreign_key :issues, referenced_table, column: :moved_to_id model.remove_partitioned_foreign_key :issues, referenced_table, column: :moved_to_id
expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id') expect_function_to_contain(function_name, 'delete from issue_assignees where issue_id = old.id')
expect_valid_function_trigger(trigger_name, function_name) expect_valid_function_trigger(referenced_table, trigger_name, function_name, after: 'delete')
end end
end end
...@@ -188,45 +190,4 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do ...@@ -188,45 +190,4 @@ describe Gitlab::Database::PartitioningMigrationHelpers::ForeignKeyHelpers do
end end
end end
end end
def expect_function_to_contain(name, *statements)
return_stmt, *body_stmts = parsed_function_statements(name).reverse
expect(return_stmt).to eq('return old')
expect(body_stmts).to contain_exactly(*statements)
end
def expect_valid_function_trigger(name, fn_name)
event, activation, definition = cleaned_trigger_def(name)
expect(event).to eq('delete')
expect(activation).to eq('after')
expect(definition).to eq("execute procedure #{fn_name}()")
end
def parsed_function_statements(name)
cleaned_definition = find_function_def(name)['fn_body'].downcase.gsub(/\s+/, ' ')
statements = cleaned_definition.sub(/\A\s*begin\s*(.*)\s*end\s*\Z/, "\\1")
statements.split(';').map! { |stmt| stmt.strip.presence }.compact!
end
def find_function_def(name)
connection.execute("select prosrc as fn_body from pg_proc where proname = '#{name}';").first
end
def cleaned_trigger_def(name)
find_trigger_def(name).values_at('event', 'activation', 'definition').map!(&:downcase)
end
def find_trigger_def(name)
connection.execute(<<~SQL).first
select
string_agg(event_manipulation, ',') as event,
action_timing as activation,
action_statement as definition
from information_schema.triggers
where trigger_name = '#{name}'
group by 2, 3
SQL
end
end end
...@@ -4,33 +4,63 @@ require 'spec_helper' ...@@ -4,33 +4,63 @@ require 'spec_helper'
describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers do describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers do
include PartitioningHelpers include PartitioningHelpers
include TriggerHelpers
let(:model) do let(:migration) do
ActiveRecord::Migration.new.extend(described_class) ActiveRecord::Migration.new.extend(described_class)
end end
let_it_be(:connection) { ActiveRecord::Base.connection } let_it_be(:connection) { ActiveRecord::Base.connection }
let(:template_table) { :audit_events } let(:template_table) { :audit_events }
let(:partitioned_table) { '_test_migration_partitioned_table' } let(:partitioned_table) { '_test_migration_partitioned_table' }
let(:function_name) { '_test_migration_function_name' }
let(:trigger_name) { '_test_migration_trigger_name' }
let(:partition_column) { 'created_at' } let(:partition_column) { 'created_at' }
let(:min_date) { Date.new(2019, 12) } let(:min_date) { Date.new(2019, 12) }
let(:max_date) { Date.new(2020, 3) } let(:max_date) { Date.new(2020, 3) }
before do before do
allow(model).to receive(:puts) allow(migration).to receive(:puts)
allow(model).to receive(:partitioned_table_name).and_return(partitioned_table) allow(migration).to receive(:transaction_open?).and_return(false)
allow(migration).to receive(:partitioned_table_name).and_return(partitioned_table)
allow(migration).to receive(:sync_function_name).and_return(function_name)
allow(migration).to receive(:sync_trigger_name).and_return(trigger_name)
allow(migration).to receive(:assert_table_is_whitelisted)
end end
describe '#partition_table_by_date' do describe '#partition_table_by_date' do
let(:partition_column) { 'created_at' }
let(:old_primary_key) { 'id' } let(:old_primary_key) { 'id' }
let(:new_primary_key) { [old_primary_key, partition_column] } let(:new_primary_key) { [old_primary_key, partition_column] }
context 'when the table is not whitelisted' do
let(:template_table) { :this_table_is_not_whitelisted }
it 'raises an error' do
expect(migration).to receive(:assert_table_is_whitelisted).with(template_table).and_call_original
expect do
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
end.to raise_error(/#{template_table} is not whitelisted for use/)
end
end
context 'when run inside a transaction block' do
it 'raises an error' do
expect(migration).to receive(:transaction_open?).and_return(true)
expect do
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
end.to raise_error(/can not be run inside a transaction/)
end
end
context 'when the the max_date is less than the min_date' do context 'when the the max_date is less than the min_date' do
let(:max_date) { Time.utc(2019, 6) } let(:max_date) { Time.utc(2019, 6) }
it 'raises an error' do it 'raises an error' do
expect do expect do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
end.to raise_error(/max_date #{max_date} must be greater than min_date #{min_date}/) end.to raise_error(/max_date #{max_date} must be greater than min_date #{min_date}/)
end end
end end
...@@ -40,7 +70,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -40,7 +70,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
it 'raises an error' do it 'raises an error' do
expect do expect do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
end.to raise_error(/max_date #{max_date} must be greater than min_date #{min_date}/) end.to raise_error(/max_date #{max_date} must be greater than min_date #{min_date}/)
end end
end end
...@@ -50,13 +80,13 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -50,13 +80,13 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
let(:partition_column) { :some_field } let(:partition_column) { :some_field }
it 'raises an error' do it 'raises an error' do
model.create_table template_table, id: false do |t| migration.create_table template_table, id: false do |t|
t.integer :id t.integer :id
t.datetime partition_column t.datetime partition_column
end end
expect do expect do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
end.to raise_error(/primary key not defined for #{template_table}/) end.to raise_error(/primary key not defined for #{template_table}/)
end end
end end
...@@ -66,14 +96,14 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -66,14 +96,14 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
it 'raises an error' do it 'raises an error' do
expect do expect do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
end.to raise_error(/partition column #{partition_column} does not exist/) end.to raise_error(/partition column #{partition_column} does not exist/)
end end
end end
context 'when a valid source table and partition column is given' do describe 'constructing the partitioned table' do
it 'creates a table partitioned by the proper column' do it 'creates a table partitioned by the proper column' do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
expect(connection.table_exists?(partitioned_table)).to be(true) expect(connection.table_exists?(partitioned_table)).to be(true)
expect(connection.primary_key(partitioned_table)).to eq(new_primary_key) expect(connection.primary_key(partitioned_table)).to eq(new_primary_key)
...@@ -82,7 +112,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -82,7 +112,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
end end
it 'removes the default from the primary key column' do it 'removes the default from the primary key column' do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
pk_column = connection.columns(partitioned_table).find { |c| c.name == old_primary_key } pk_column = connection.columns(partitioned_table).find { |c| c.name == old_primary_key }
...@@ -90,7 +120,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -90,7 +120,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
end end
it 'creates the partitioned table with the same non-key columns' do it 'creates the partitioned table with the same non-key columns' do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
copied_columns = filter_columns_by_name(connection.columns(partitioned_table), new_primary_key) copied_columns = filter_columns_by_name(connection.columns(partitioned_table), new_primary_key)
original_columns = filter_columns_by_name(connection.columns(template_table), new_primary_key) original_columns = filter_columns_by_name(connection.columns(template_table), new_primary_key)
...@@ -99,7 +129,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -99,7 +129,7 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
end end
it 'creates a partition spanning over each month in the range given' do it 'creates a partition spanning over each month in the range given' do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
expect_range_partition_of("#{partitioned_table}_000000", partitioned_table, 'MINVALUE', "'2019-12-01 00:00:00'") expect_range_partition_of("#{partitioned_table}_000000", partitioned_table, 'MINVALUE', "'2019-12-01 00:00:00'")
expect_range_partition_of("#{partitioned_table}_201912", partitioned_table, "'2019-12-01 00:00:00'", "'2020-01-01 00:00:00'") expect_range_partition_of("#{partitioned_table}_201912", partitioned_table, "'2019-12-01 00:00:00'", "'2020-01-01 00:00:00'")
...@@ -107,6 +137,76 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -107,6 +137,76 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
expect_range_partition_of("#{partitioned_table}_202002", partitioned_table, "'2020-02-01 00:00:00'", "'2020-03-01 00:00:00'") expect_range_partition_of("#{partitioned_table}_202002", partitioned_table, "'2020-02-01 00:00:00'", "'2020-03-01 00:00:00'")
end end
end end
describe 'keeping data in sync with the partitioned table' do
let(:template_table) { :todos }
let(:model) { Class.new(ActiveRecord::Base) }
let(:timestamp) { Time.utc(2019, 12, 1, 12).round }
before do
model.primary_key = :id
model.table_name = partitioned_table
end
it 'creates a trigger function on the original table' do
expect_function_not_to_exist(function_name)
expect_trigger_not_to_exist(template_table, trigger_name)
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
expect_function_to_exist(function_name)
expect_valid_function_trigger(template_table, trigger_name, function_name, after: %w[delete insert update])
end
it 'syncs inserts to the partitioned tables' do
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
expect(model.count).to eq(0)
first_todo = create(:todo, created_at: timestamp, updated_at: timestamp)
second_todo = create(:todo, created_at: timestamp, updated_at: timestamp)
expect(model.count).to eq(2)
expect(model.find(first_todo.id).attributes).to eq(first_todo.attributes)
expect(model.find(second_todo.id).attributes).to eq(second_todo.attributes)
end
it 'syncs updates to the partitioned tables' do
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
first_todo = create(:todo, :pending, commit_id: nil, created_at: timestamp, updated_at: timestamp)
second_todo = create(:todo, created_at: timestamp, updated_at: timestamp)
expect(model.count).to eq(2)
first_copy = model.find(first_todo.id)
second_copy = model.find(second_todo.id)
expect(first_copy.attributes).to eq(first_todo.attributes)
expect(second_copy.attributes).to eq(second_todo.attributes)
first_todo.update(state_event: 'done', commit_id: 'abc123', updated_at: timestamp + 1.second)
expect(model.count).to eq(2)
expect(first_copy.reload.attributes).to eq(first_todo.attributes)
expect(second_copy.reload.attributes).to eq(second_todo.attributes)
end
it 'syncs deletes to the partitioned tables' do
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
first_todo = create(:todo, created_at: timestamp, updated_at: timestamp)
second_todo = create(:todo, created_at: timestamp, updated_at: timestamp)
expect(model.count).to eq(2)
first_todo.destroy
expect(model.count).to eq(1)
expect(model.find_by_id(first_todo.id)).to be_nil
expect(model.find(second_todo.id).attributes).to eq(second_todo.attributes)
end
end
end end
describe '#drop_partitioned_table_for' do describe '#drop_partitioned_table_for' do
...@@ -114,14 +214,38 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers ...@@ -114,14 +214,38 @@ describe Gitlab::Database::PartitioningMigrationHelpers::TableManagementHelpers
%w[000000 201912 202001 202002].map { |suffix| "#{partitioned_table}_#{suffix}" }.unshift(partitioned_table) %w[000000 201912 202001 202002].map { |suffix| "#{partitioned_table}_#{suffix}" }.unshift(partitioned_table)
end end
context 'when the table is not whitelisted' do
let(:template_table) { :this_table_is_not_whitelisted }
it 'raises an error' do
expect(migration).to receive(:assert_table_is_whitelisted).with(template_table).and_call_original
expect do
migration.drop_partitioned_table_for template_table
end.to raise_error(/#{template_table} is not whitelisted for use/)
end
end
it 'drops the trigger syncing to the partitioned table' do
migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
expect_function_to_exist(function_name)
expect_valid_function_trigger(template_table, trigger_name, function_name, after: %w[delete insert update])
migration.drop_partitioned_table_for template_table
expect_function_not_to_exist(function_name)
expect_trigger_not_to_exist(template_table, trigger_name)
end
it 'drops the partitioned copy and all partitions' do it 'drops the partitioned copy and all partitions' do
model.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date migration.partition_table_by_date template_table, partition_column, min_date: min_date, max_date: max_date
expected_tables.each do |table| expected_tables.each do |table|
expect(connection.table_exists?(table)).to be(true) expect(connection.table_exists?(table)).to be(true)
end end
model.drop_partitioned_table_for template_table migration.drop_partitioned_table_for template_table
expected_tables.each do |table| expected_tables.each do |table|
expect(connection.table_exists?(table)).to be(false) expect(connection.table_exists?(table)).to be(false)
......
# frozen_string_literal: true
module TriggerHelpers
def expect_function_to_exist(name)
expect(find_function_def(name)).not_to be_nil
end
def expect_function_not_to_exist(name)
expect(find_function_def(name)).to be_nil
end
def expect_function_to_contain(name, *statements)
return_stmt, *body_stmts = parsed_function_statements(name).reverse
expect(return_stmt).to eq('return old')
expect(body_stmts).to contain_exactly(*statements)
end
def expect_trigger_not_to_exist(table_name, name)
expect(find_trigger_def(table_name, name)).to be_nil
end
def expect_valid_function_trigger(table_name, name, fn_name, fires_on)
events, timing, definition = cleaned_trigger_def(table_name, name)
events = events&.split(',')
expected_timing, expected_events = fires_on.first
expect(timing).to eq(expected_timing.to_s)
expect(events).to match_array(Array.wrap(expected_events))
expect(definition).to eq("execute procedure #{fn_name}()")
end
private
def parsed_function_statements(name)
cleaned_definition = find_function_def(name)['body'].downcase.gsub(/\s+/, ' ')
statements = cleaned_definition.sub(/\A\s*begin\s*(.*)\s*end\s*\Z/, "\\1")
statements.split(';').map! { |stmt| stmt.strip.presence }.compact!
end
def find_function_def(name)
connection.select_one(<<~SQL)
SELECT prosrc AS body
FROM pg_proc
WHERE proname = '#{name}'
SQL
end
def cleaned_trigger_def(table_name, name)
find_trigger_def(table_name, name).values_at('event', 'action_timing', 'action_statement').map!(&:downcase)
end
def find_trigger_def(table_name, name)
connection.select_one(<<~SQL)
SELECT
string_agg(event_manipulation, ',') AS event,
action_timing,
action_statement
FROM information_schema.triggers
WHERE event_object_table = '#{table_name}'
AND trigger_name = '#{name}'
GROUP BY 2, 3
SQL
end
end
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment