Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
G
gitlab-ce
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
1
Merge Requests
1
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
nexedi
gitlab-ce
Commits
b1515009
Commit
b1515009
authored
Feb 26, 2018
by
Douglas Barbosa Alexandre
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Fix repository synchronization order for projects updated recently
parent
8b0345d7
Changes
3
Show whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
75 additions
and
20 deletions
+75
-20
ee/app/finders/geo/project_registry_finder.rb
ee/app/finders/geo/project_registry_finder.rb
+19
-5
ee/app/workers/geo/repository_shard_sync_worker.rb
ee/app/workers/geo/repository_shard_sync_worker.rb
+1
-1
ee/spec/workers/geo/repository_shard_sync_worker_spec.rb
ee/spec/workers/geo/repository_shard_sync_worker_spec.rb
+55
-14
No files found.
ee/app/finders/geo/project_registry_finder.rb
View file @
b1515009
...
...
@@ -141,11 +141,25 @@ module Geo
# @return [ActiveRecord::Relation<Project>] list of projects updated recently
def
legacy_find_projects_updated_recently
legacy_inner_join_registry_ids
(
current_node
.
projects
,
Geo
::
ProjectRegistry
.
dirty
.
retry_due
.
pluck
(
:project_id
),
Project
)
registries
=
Geo
::
ProjectRegistry
.
dirty
.
retry_due
.
pluck
(
:project_id
,
:last_repository_successful_sync_at
)
return
Project
.
none
if
registries
.
empty?
id_and_last_sync_values
=
registries
.
map
do
|
id
,
last_repository_successful_sync_at
|
"(
#{
id
}
,
#{
quote_value
(
last_repository_successful_sync_at
)
}
)"
end
joined_relation
=
current_node
.
projects
.
joins
(
<<~
SQL
)
INNER JOIN
(VALUES
#{
id_and_last_sync_values
.
join
(
','
)
}
)
project_registry(id, last_repository_successful_sync_at)
ON
#{
Project
.
table_name
}
.id = project_registry.id
SQL
joined_relation
end
def
quote_value
(
value
)
::
Gitlab
::
SQL
::
Glob
.
q
(
value
)
end
# @return [ActiveRecord::Relation<Geo::ProjectRegistry>] list of synced projects
...
...
ee/app/workers/geo/repository_shard_sync_worker.rb
View file @
b1515009
...
...
@@ -65,7 +65,7 @@ module Geo
def
find_project_ids_updated_recently
(
batch_size
:)
shard_restriction
(
finder
.
find_projects_updated_recently
(
batch_size:
batch_size
))
.
order
(
Gitlab
::
Database
.
nulls_first_order
(
:last_repository_updated_at
,
:desc
)
)
.
order
(
'project_registry.last_repository_successful_sync_at ASC NULLS FIRST, projects.last_repository_updated_at ASC'
)
.
pluck
(
:id
)
end
...
...
ee/spec/workers/geo/repository_shard_sync_worker_spec.rb
View file @
b1515009
...
...
@@ -7,12 +7,13 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
let!
(
:primary
)
{
create
(
:geo_node
,
:primary
)
}
let!
(
:secondary
)
{
create
(
:geo_node
)
}
let!
(
:synced_group
)
{
create
(
:group
)
}
let!
(
:project_in_synced_group
)
{
create
(
:project
,
group:
synced_group
)
}
let!
(
:restricted_group
)
{
create
(
:group
)
}
let!
(
:unsynced_project_in_restricted_group
)
{
create
(
:project
,
group:
restricted_group
)
}
let!
(
:unsynced_project
)
{
create
(
:project
)
}
let
(
:shard_name
)
{
Gitlab
.
config
.
repositories
.
storages
.
keys
.
first
}
subject
{
described_class
.
new
}
let
(
:shard_name
)
{
Gitlab
.
config
.
repositories
.
storages
.
keys
.
first
}
before
do
stub_current_geo_node
(
secondary
)
...
...
@@ -37,7 +38,7 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
end
it
'performs Geo::ProjectSyncWorker for projects where last attempt to sync failed'
do
create
(
:geo_project_registry
,
:sync_failed
,
project:
project_in_sync
ed_group
)
create
(
:geo_project_registry
,
:sync_failed
,
project:
unsynced_project_in_restrict
ed_group
)
create
(
:geo_project_registry
,
:synced
,
project:
unsynced_project
)
expect
(
Geo
::
ProjectSyncWorker
).
to
receive
(
:perform_async
).
once
.
and_return
(
spy
)
...
...
@@ -54,7 +55,7 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
end
it
'performs Geo::ProjectSyncWorker for synced projects updated recently'
do
create
(
:geo_project_registry
,
:synced
,
:repository_dirty
,
project:
project_in_sync
ed_group
)
create
(
:geo_project_registry
,
:synced
,
:repository_dirty
,
project:
unsynced_project_in_restrict
ed_group
)
create
(
:geo_project_registry
,
:synced
,
project:
unsynced_project
)
create
(
:geo_project_registry
,
:synced
,
:wiki_dirty
)
...
...
@@ -104,12 +105,12 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
context
'when node has namespace restrictions'
do
before
do
secondary
.
update!
(
selective_sync_type:
'namespaces'
,
namespaces:
[
sync
ed_group
])
secondary
.
update!
(
selective_sync_type:
'namespaces'
,
namespaces:
[
restrict
ed_group
])
end
it
'does not perform Geo::ProjectSyncWorker for projects that do not belong to selected namespaces to replicate'
do
expect
(
Geo
::
ProjectSyncWorker
).
to
receive
(
:perform_async
)
.
with
(
project_in_sync
ed_group
.
id
,
within
(
1
.
minute
).
of
(
Time
.
now
))
.
with
(
unsynced_project_in_restrict
ed_group
.
id
,
within
(
1
.
minute
).
of
(
Time
.
now
))
.
once
.
and_return
(
spy
)
...
...
@@ -117,11 +118,11 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
end
it
'does not perform Geo::ProjectSyncWorker for synced projects updated recently that do not belong to selected namespaces to replicate'
do
create
(
:geo_project_registry
,
:synced
,
:repository_dirty
,
project:
project_in_sync
ed_group
)
create
(
:geo_project_registry
,
:synced
,
:repository_dirty
,
project:
unsynced_project_in_restrict
ed_group
)
create
(
:geo_project_registry
,
:synced
,
:repository_dirty
,
project:
unsynced_project
)
expect
(
Geo
::
ProjectSyncWorker
).
to
receive
(
:perform_async
)
.
with
(
project_in_sync
ed_group
.
id
,
within
(
1
.
minute
).
of
(
Time
.
now
))
.
with
(
unsynced_project_in_restrict
ed_group
.
id
,
within
(
1
.
minute
).
of
(
Time
.
now
))
.
once
.
and_return
(
spy
)
...
...
@@ -129,13 +130,53 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
end
end
context
'repositories that have never been updated'
do
let!
(
:project_list
)
{
create_list
(
:project
,
4
,
last_repository_updated_at:
2
.
hours
.
ago
)
}
let!
(
:abandoned_project
)
{
create
(
:project
)
}
before
do
# Project sync failed but never received an update
create
(
:geo_project_registry
,
:repository_sync_failed
,
project:
abandoned_project
)
abandoned_project
.
update_column
(
:last_repository_updated_at
,
1
.
year
.
ago
)
# Neither of these are needed for this spec
unsynced_project
.
destroy
unsynced_project_in_restricted_group
.
destroy
allow_any_instance_of
(
described_class
).
to
receive
(
:db_retrieve_batch_size
).
and_return
(
2
)
# Must be >1 because of the Geo::BaseSchedulerWorker#interleave
secondary
.
update!
(
repos_max_capacity:
3
)
# Must be more than db_retrieve_batch_size
project_list
.
each
do
|
project
|
allow
(
Geo
::
ProjectSyncWorker
)
.
to
receive
(
:perform_async
)
.
with
(
project
.
id
,
anything
)
.
and_call_original
end
allow_any_instance_of
(
Geo
::
ProjectRegistry
).
to
receive
(
:wiki_sync_due?
).
and_return
(
false
)
allow_any_instance_of
(
Geo
::
RepositorySyncService
).
to
receive
(
:expire_repository_caches
)
end
it
'tries to sync project where last attempt to sync failed'
do
expect
(
Geo
::
ProjectSyncWorker
)
.
to
receive
(
:perform_async
)
.
with
(
abandoned_project
.
id
,
anything
)
.
at_least
(
:once
)
.
and_return
(
spy
)
3
.
times
do
Sidekiq
::
Testing
.
inline!
{
subject
.
perform
(
shard_name
)
}
end
end
end
context
'all repositories fail'
do
let!
(
:project_list
)
{
create_list
(
:project
,
4
,
:random_last_repository_updated_at
)
}
before
do
# Neither of these are needed for this spec
unsynced_project
.
destroy
project_in_sync
ed_group
.
destroy
unsynced_project_in_restrict
ed_group
.
destroy
allow_any_instance_of
(
described_class
).
to
receive
(
:db_retrieve_batch_size
).
and_return
(
2
)
# Must be >1 because of the Geo::BaseSchedulerWorker#interleave
secondary
.
update!
(
repos_max_capacity:
3
)
# Must be more than db_retrieve_batch_size
...
...
@@ -161,14 +202,14 @@ describe Geo::RepositoryShardSyncWorker, :geo, :delete, :clean_gitlab_redis_cach
context
'additional shards'
do
it
'skips backfill for projects on unhealthy shards'
do
missing_not_synced
=
create
(
:project
,
group:
sync
ed_group
)
missing_not_synced
=
create
(
:project
,
group:
restrict
ed_group
)
missing_not_synced
.
update_column
(
:repository_storage
,
'unknown'
)
missing_dirty
=
create
(
:project
,
group:
sync
ed_group
)
missing_dirty
=
create
(
:project
,
group:
restrict
ed_group
)
missing_dirty
.
update_column
(
:repository_storage
,
'unknown'
)
create
(
:geo_project_registry
,
:synced
,
:repository_dirty
,
project:
missing_dirty
)
expect
(
Geo
::
ProjectSyncWorker
).
to
receive
(
:perform_async
).
with
(
project_in_sync
ed_group
.
id
,
anything
)
expect
(
Geo
::
ProjectSyncWorker
).
to
receive
(
:perform_async
).
with
(
unsynced_project_in_restrict
ed_group
.
id
,
anything
)
expect
(
Geo
::
ProjectSyncWorker
).
not_to
receive
(
:perform_async
).
with
(
missing_not_synced
.
id
,
anything
)
expect
(
Geo
::
ProjectSyncWorker
).
not_to
receive
(
:perform_async
).
with
(
missing_dirty
.
id
,
anything
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment