Commit 860fe038 authored by Mike Kozono's avatar Mike Kozono

Handle concurrent VerificationWorker

And also prevent backfill from working the same record.
parent ef538e9f
...@@ -47,12 +47,26 @@ module Geo ...@@ -47,12 +47,26 @@ module Geo
end end
def verify_async def verify_async
# Marking started prevents backfill (VerificationBatchWorker) from picking
# this up too.
# Also, if another verification job is running, this will make that job
# set state to pending after it finishes, since the calculated checksum
# is already invalidated.
model_record.verification_started!
Geo::VerificationWorker.perform_async(replicable_name, model_record.id) Geo::VerificationWorker.perform_async(replicable_name, model_record.id)
end end
# Calculates checksum and asks the model/registry to update verification
# state.
def verify def verify
# Deduplicate verification job
return unless model_record.verification_started?
calculation_started_at = Time.current
checksum = model_record.calculate_checksum checksum = model_record.calculate_checksum
model_record.verification_succeeded_with_checksum!(checksum)
model_record.verification_succeeded_with_checksum!(checksum, calculation_started_at)
rescue => e rescue => e
model_record.verification_failed_with_message!('Error calculating the checksum', e) model_record.verification_failed_with_message!('Error calculating the checksum', e)
end end
......
...@@ -51,7 +51,6 @@ module Gitlab ...@@ -51,7 +51,6 @@ module Gitlab
before_transition any => :verification_started do |instance, _| before_transition any => :verification_started do |instance, _|
instance.verification_started_at = Time.current instance.verification_started_at = Time.current
instance.verification_failure = nil
end end
before_transition any => :verification_pending do |instance, _| before_transition any => :verification_pending do |instance, _|
...@@ -76,7 +75,7 @@ module Gitlab ...@@ -76,7 +75,7 @@ module Gitlab
end end
event :verification_started do event :verification_started do
transition [:verification_pending, :verification_succeeded, :verification_failed] => :verification_started transition [:verification_pending, :verification_started, :verification_succeeded, :verification_failed] => :verification_started
end end
event :verification_succeeded do event :verification_succeeded do
...@@ -102,10 +101,21 @@ module Gitlab ...@@ -102,10 +101,21 @@ module Gitlab
# Convenience method to update checksum and transition to success state. # Convenience method to update checksum and transition to success state.
# #
# @param [String] checksum value generated by the checksum routine # @param [String] checksum value generated by the checksum routine
def verification_succeeded_with_checksum!(checksum) # @param [DateTime] calculation_started_at the moment just before the
# checksum routine was called
def verification_succeeded_with_checksum!(checksum, calculation_started_at)
self.verification_checksum = checksum self.verification_checksum = checksum
self.verification_succeeded! self.verification_succeeded!
if resource_updated_during_checksum?(calculation_started_at)
# just let backfill pick it up
self.verification_pending!
end
end
def resource_updated_during_checksum?(calculation_started_at)
self.reset.verification_started_at > calculation_started_at
end end
# Convenience method to update failure message and transition to failed # Convenience method to update failure message and transition to failed
......
...@@ -27,13 +27,28 @@ RSpec.describe Gitlab::Geo::VerificationState do ...@@ -27,13 +27,28 @@ RSpec.describe Gitlab::Geo::VerificationState do
subject { DummyModel.new } subject { DummyModel.new }
describe '#verification_succeeded_with_checksum!' do describe '#verification_succeeded_with_checksum!' do
context 'when the resource was updated during checksum calculation' do
let(:calculation_started_at) { subject.verification_started_at - 1.second }
it 'sets state to pending' do
subject.verification_succeeded_with_checksum!('abc123', calculation_started_at)
expect(subject.reload.verification_pending?).to be_truthy
end
end
context 'when the resource was not updated during checksum calculation' do
let(:calculation_started_at) { subject.verification_started_at + 1.second }
it 'saves the checksum' do it 'saves the checksum' do
subject.verification_succeeded_with_checksum!('abc123') subject.verification_succeeded_with_checksum!('abc123', calculation_started_at)
expect(subject.reload.verification_succeeded?).to be_truthy
expect(subject.reload.verification_checksum).to eq('abc123') expect(subject.reload.verification_checksum).to eq('abc123')
expect(subject.verified_at).not_to be_nil expect(subject.verified_at).not_to be_nil
end end
end end
end
describe '#verification_failed_with_message!' do describe '#verification_failed_with_message!' do
it 'saves the error message and increments retry counter' do it 'saves the error message and increments retry counter' do
...@@ -41,6 +56,7 @@ RSpec.describe Gitlab::Geo::VerificationState do ...@@ -41,6 +56,7 @@ RSpec.describe Gitlab::Geo::VerificationState do
subject.verification_failed_with_message!('Failure to calculate checksum', error) subject.verification_failed_with_message!('Failure to calculate checksum', error)
expect(subject.reload.verification_failed?).to be_truthy
expect(subject.reload.verification_failure).to eq 'Failure to calculate checksum: An error message' expect(subject.reload.verification_failure).to eq 'Failure to calculate checksum: An error message'
expect(subject.verification_retry_count).to be 1 expect(subject.verification_retry_count).to be 1
end end
......
...@@ -122,12 +122,26 @@ RSpec.shared_examples 'a verifiable replicator' do ...@@ -122,12 +122,26 @@ RSpec.shared_examples 'a verifiable replicator' do
end end
end end
describe '#verify' do describe '#verify_async' do
before do before do
model_record.verification_started
model_record.save! model_record.save!
end end
context 'on a Geo primary' do
before do
stub_primary_node
end
it 'calls verification_started! and enqueues VerificationWorker' do
expect(model_record).to receive(:verification_started!)
expect(Geo::VerificationWorker).to receive(:perform_async).with(replicator.replicable_name, model_record.id)
replicator.verify_async
end
end
end
describe '#verify' do
context 'on a Geo primary' do context 'on a Geo primary' do
before do before do
stub_primary_node stub_primary_node
...@@ -141,7 +155,7 @@ RSpec.shared_examples 'a verifiable replicator' do ...@@ -141,7 +155,7 @@ RSpec.shared_examples 'a verifiable replicator' do
context 'when the checksum succeeds' do context 'when the checksum succeeds' do
it 'delegates checksum calculation and the state change to model_record' do it 'delegates checksum calculation and the state change to model_record' do
expect(model_record).to receive(:calculate_checksum).and_return('abc123') expect(model_record).to receive(:calculate_checksum).and_return('abc123')
expect(model_record).to receive(:verification_succeeded_with_checksum!).with('abc123') expect(model_record).to receive(:verification_succeeded_with_checksum!).with('abc123', kind_of(Time))
replicator.verify replicator.verify
end end
...@@ -160,6 +174,14 @@ RSpec.shared_examples 'a verifiable replicator' do ...@@ -160,6 +174,14 @@ RSpec.shared_examples 'a verifiable replicator' do
end end
end end
end end
context 'when verification was not started' do
it 'does not call calculate_checksum!' do
expect(model_record).not_to receive(:calculate_checksum)
replicator.verify
end
end
end end
end end
end end
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment