Commit b204d11c authored by Tiago Botelho's avatar Tiago Botelho

Adds background migrations

parent 35b61707
...@@ -651,80 +651,87 @@ class Project < ActiveRecord::Base ...@@ -651,80 +651,87 @@ class Project < ActiveRecord::Base
import_started? || import_scheduled? import_started? || import_scheduled?
end end
def ensure_import_state(param) def import_state_args
return unless self[param] && import_state.nil? {
status: self[:import_status],
jid: self[:import_jid],
last_error: self[:import_error]
}
end
def ensure_import_state
return if self[:import_status] == 'none' || self[:import_status].nil?
return unless import_state.nil?
create_import_state(status: self[:import_status], create_import_state(import_state_args)
jid: self[:import_jid],
last_error: self[:import_error])
update(import_status: nil) update_column(:import_status, 'none')
end end
def import_schedule def import_schedule
ensure_import_state(:import_status) ensure_import_state
import_state&.schedule import_state&.schedule
end end
def force_import_start def force_import_start
ensure_import_state(:import_status) ensure_import_state
import_state&.force_start import_state&.force_start
end end
def import_start def import_start
ensure_import_state(:import_status) ensure_import_state
import_state&.start import_state&.start
end end
def import_fail def import_fail
ensure_import_state(:import_status) ensure_import_state
import_state&.fail_op import_state&.fail_op
end end
def import_finish def import_finish
ensure_import_state(:import_status) ensure_import_state
import_state&.finish import_state&.finish
end end
def import_jid=(new_jid) def import_jid=(new_jid)
return super unless import_state ensure_import_state
import_state.jid = new_jid import_state&.jid = new_jid
end end
def import_jid def import_jid
ensure_import_state(:import_jid) ensure_import_state
import_state&.jid import_state&.jid
end end
def import_error=(new_error) def import_error=(new_error)
return super unless import_state ensure_import_state
import_state.last_error = new_error import_state&.last_error = new_error
end end
def import_error def import_error
ensure_import_state(:import_error) ensure_import_state
import_state&.last_error import_state&.last_error
end end
def import_status=(new_status) def import_status=(new_status)
return super unless import_state ensure_import_state
import_state.status = new_status import_state&.status = new_status
end end
def import_status def import_status
ensure_import_state(:import_status) ensure_import_state
import_state&.status import_state&.status || 'none'
end end
def no_import? def no_import?
...@@ -1588,8 +1595,7 @@ class Project < ActiveRecord::Base ...@@ -1588,8 +1595,7 @@ class Project < ActiveRecord::Base
Gitlab::SidekiqStatus.unset(import_jid) Gitlab::SidekiqStatus.unset(import_jid)
self.import_jid = nil import_state.update_column(:jid, nil)
self.save(validate: false)
end end
def running_or_pending_build_count(force: false) def running_or_pending_build_count(force: false)
...@@ -1609,8 +1615,7 @@ class Project < ActiveRecord::Base ...@@ -1609,8 +1615,7 @@ class Project < ActiveRecord::Base
import_fail import_fail
self.import_error = sanitized_message import_state.update_column(:last_error, sanitized_message)
self.save(validate: false)
rescue ActiveRecord::ActiveRecordError => e rescue ActiveRecord::ActiveRecordError => e
Rails.logger.error("Error setting import status to failed: #{e.message}. Original error: #{sanitized_message}") Rails.logger.error("Error setting import status to failed: #{e.message}. Original error: #{sanitized_message}")
ensure ensure
......
...@@ -64,10 +64,8 @@ module Gitlab ...@@ -64,10 +64,8 @@ module Gitlab
def find_project(id) def find_project(id)
# TODO: Only select the JID # TODO: Only select the JID
# We only care about the import JID so we can refresh it. We also only # This is due to the fact that the JID could be present in either the project record or
# want the project if it hasn't been marked as failed yet. It's possible # its associated import_state record
# the import gets marked as stuck when jobs of the current stage failed
# somehow.
Project.import_started.find_by(id: id) Project.import_started.find_by(id: id)
end end
end end
......
...@@ -31,7 +31,9 @@ module Gitlab ...@@ -31,7 +31,9 @@ module Gitlab
end end
def find_project(id) def find_project(id)
# TODO: select only import_jid # TODO: Only select the JID
# This is due to the fact that the JID could be present in either the project record or
# its associated import_state record
Project.import_started.find_by(id: id) Project.import_started.find_by(id: id)
end end
end end
......
class AddIndexesToProjectMirrorData < ActiveRecord::Migration
include Gitlab::Database::MigrationHelpers
DOWNTIME = false
disable_ddl_transaction!
def up
add_concurrent_index :project_mirror_data, :last_successful_update_at
add_concurrent_index :project_mirror_data, :jid
add_concurrent_index :project_mirror_data, :status
end
def down
remove_index :project_mirror_data, :last_successful_update_at if index_exists? :project_mirror_data, :last_successful_update_at
remove_index :project_mirror_data, :jid if index_exists? :project_mirror_data, :jid
remove_index :project_mirror_data, :status if index_exists? :project_mirror_data, :status
end
end
...@@ -3,6 +3,12 @@ class MigrateImportAttributesDataFromProjectsToProjectMirrorData < ActiveRecord: ...@@ -3,6 +3,12 @@ class MigrateImportAttributesDataFromProjectsToProjectMirrorData < ActiveRecord:
DOWNTIME = false DOWNTIME = false
UP_MIGRATION = 'PopulateImportState'.freeze
DOWN_MIGRATION = 'RollbackImportStateData'.freeze
BATCH_SIZE = 1000
DELAY_INTERVAL = 5.minutes
disable_ddl_transaction! disable_ddl_transaction!
class Project < ActiveRecord::Base class Project < ActiveRecord::Base
...@@ -18,54 +24,14 @@ class MigrateImportAttributesDataFromProjectsToProjectMirrorData < ActiveRecord: ...@@ -18,54 +24,14 @@ class MigrateImportAttributesDataFromProjectsToProjectMirrorData < ActiveRecord:
end end
def up def up
Project.where.not(import_status: nil).each_batch do |batch| projects = Project.where.not(import_status: :none)
start, stop = batch.pluck('MIN(id), MAX(id)').first
execute <<~SQL queue_background_migration_jobs_by_range_at_intervals(projects, UP_MIGRATION, DELAY_INTERVAL, batch_size: BATCH_SIZE)
INSERT INTO project_mirror_data (project_id, status, jid, last_update_at, last_successful_update_at, last_error)
SELECT id, import_status, import_jid, mirror_last_update_at, mirror_last_successful_update_at, import_error
FROM projects proj
WHERE proj.import_status IS NOT NULL
AND proj.id >= #{start}
AND proj.id < #{stop}
SQL
execute <<~SQL
UPDATE projects
SET import_status = NULL
WHERE import_status IS NOT NULL
AND id >= #{start}
AND id < #{stop}
SQL
end
end end
def down def down
ProjectImportState.where.not(status: nil).each_batch do |batch| import_state = ProjectImportState.where.not(status: :none)
start, stop = batch.pluck('MIN(id), MAX(id)').first
execute <<~SQL
UPDATE projects
SET
import_status = mirror_data.status,
import_jid = mirror_data.jid,
mirror_last_update_at = mirror_data.last_update_at,
mirror_last_successful_update_at = mirror_data.last_successful_update_at,
import_error = mirror_data.last_error
FROM project_mirror_data mirror_data
WHERE mirror_data.project_id = projects.id
AND mirror_data.status IS NOT NULL
AND mirror_data.id >= #{start}
AND mirror_data.id < #{stop}
SQL
execute <<~SQL queue_background_migration_jobs_by_range_at_intervals(import_state, DOWN_MIGRATION, DELAY_INTERVAL, batch_size: BATCH_SIZE)
UPDATE project_mirror_data
SET status = NULL
WHERE status IS NOT NULL
AND id >= #{start}
AND id < #{stop}
SQL
end
end end
end end
class MigrateMirrorAttributesDataFromProjectsToImportState < ActiveRecord::Migration
include Gitlab::Database::MigrationHelpers
DOWNTIME = false
disable_ddl_transaction!
class Project < ActiveRecord::Base
include EachBatch
self.table_name = 'projects'
end
def up
Project.joins('INNER JOIN project_mirror_data ON project_mirror_data.project_id = projects.id').each_batch do |batch|
start, stop = batch.pluck('MIN(projects.id), MAX(projects.id)').first
execute <<~SQL
UPDATE project_mirror_data
SET
status = proj.import_status,
jid = proj.import_jid,
last_update_at = proj.mirror_last_update_at,
last_successful_update_at = proj.mirror_last_successful_update_at,
last_error = proj.import_error
FROM projects proj
WHERE proj.id = project_id
AND proj.mirror = TRUE
AND proj.id >= #{start}
AND proj.id < #{stop}
SQL
execute <<~SQL
UPDATE projects
SET import_status = NULL
WHERE mirror = TRUE
AND id >= #{start}
AND id < #{stop}
SQL
end
end
def down
Project.joins('INNER JOIN project_mirror_data ON project_mirror_data.project_id = projects.id').each_batch do |batch|
start, stop = batch.pluck('MIN(projects.id), MAX(projects.id)').first
execute <<~SQL
UPDATE projects
SET
projects.import_status = import_state.status,
projects.import_jid = import_state.jid,
projects.mirror_last_update_at = import_state.last_update_at,
projects.mirror_last_successful_update_at = import_state.last_successful_update_at,
projects.import_error = import_state.last_error
FROM project_mirror_data import_state
WHERE import_state.project_id = projects.id
AND projects.mirror = TRUE
AND projects.id >= #{start}
AND projects.id < #{stop}
SQL
execute <<~SQL
UPDATE project_mirror_data
SET
status = NULL
FROM projects proj
WHERE proj.id = project_id
AND proj.mirror = TRUE
AND proj.id >= #{start}
AND proj.id < #{stop}
SQL
end
end
end
...@@ -11,7 +11,7 @@ ...@@ -11,7 +11,7 @@
# #
# It's strongly recommended that you check this file into your version control system. # It's strongly recommended that you check this file into your version control system.
ActiveRecord::Schema.define(version: 20180503150427) do ActiveRecord::Schema.define(version: 20180503154922) do
# These are extensions that must be enabled in order to support this database # These are extensions that must be enabled in order to support this database
enable_extension "plpgsql" enable_extension "plpgsql"
...@@ -1987,8 +1987,11 @@ ActiveRecord::Schema.define(version: 20180503150427) do ...@@ -1987,8 +1987,11 @@ ActiveRecord::Schema.define(version: 20180503150427) do
t.text "last_error" t.text "last_error"
end end
add_index "project_mirror_data", ["jid"], name: "index_project_mirror_data_on_jid", using: :btree
add_index "project_mirror_data", ["last_successful_update_at"], name: "index_project_mirror_data_on_last_successful_update_at", using: :btree
add_index "project_mirror_data", ["next_execution_timestamp", "retry_count"], name: "index_mirror_data_on_next_execution_and_retry_count", using: :btree add_index "project_mirror_data", ["next_execution_timestamp", "retry_count"], name: "index_mirror_data_on_next_execution_and_retry_count", using: :btree
add_index "project_mirror_data", ["project_id"], name: "index_project_mirror_data_on_project_id", unique: true, using: :btree add_index "project_mirror_data", ["project_id"], name: "index_project_mirror_data_on_project_id", unique: true, using: :btree
add_index "project_mirror_data", ["status"], name: "index_project_mirror_data_on_status", using: :btree
create_table "project_repository_states", force: :cascade do |t| create_table "project_repository_states", force: :cascade do |t|
t.integer "project_id", null: false t.integer "project_id", null: false
...@@ -2031,6 +2034,7 @@ ActiveRecord::Schema.define(version: 20180503150427) do ...@@ -2031,6 +2034,7 @@ ActiveRecord::Schema.define(version: 20180503150427) do
t.integer "visibility_level", default: 0, null: false t.integer "visibility_level", default: 0, null: false
t.boolean "archived", default: false, null: false t.boolean "archived", default: false, null: false
t.string "avatar" t.string "avatar"
t.string "import_status"
t.text "merge_requests_template" t.text "merge_requests_template"
t.integer "star_count", default: 0, null: false t.integer "star_count", default: 0, null: false
t.boolean "merge_requests_rebase_enabled", default: false t.boolean "merge_requests_rebase_enabled", default: false
...@@ -2041,7 +2045,10 @@ ActiveRecord::Schema.define(version: 20180503150427) do ...@@ -2041,7 +2045,10 @@ ActiveRecord::Schema.define(version: 20180503150427) do
t.boolean "merge_requests_ff_only_enabled", default: false t.boolean "merge_requests_ff_only_enabled", default: false
t.text "issues_template" t.text "issues_template"
t.boolean "mirror", default: false, null: false t.boolean "mirror", default: false, null: false
t.datetime "mirror_last_update_at"
t.datetime "mirror_last_successful_update_at"
t.integer "mirror_user_id" t.integer "mirror_user_id"
t.text "import_error"
t.integer "ci_id" t.integer "ci_id"
t.boolean "shared_runners_enabled", default: true, null: false t.boolean "shared_runners_enabled", default: true, null: false
t.string "runners_token" t.string "runners_token"
...@@ -2068,6 +2075,7 @@ ActiveRecord::Schema.define(version: 20180503150427) do ...@@ -2068,6 +2075,7 @@ ActiveRecord::Schema.define(version: 20180503150427) do
t.boolean "printing_merge_request_link_enabled", default: true, null: false t.boolean "printing_merge_request_link_enabled", default: true, null: false
t.integer "auto_cancel_pending_pipelines", default: 1, null: false t.integer "auto_cancel_pending_pipelines", default: 1, null: false
t.boolean "service_desk_enabled", default: true t.boolean "service_desk_enabled", default: true
t.string "import_jid"
t.integer "cached_markdown_version" t.integer "cached_markdown_version"
t.text "delete_error" t.text "delete_error"
t.datetime "last_repository_updated_at" t.datetime "last_repository_updated_at"
...@@ -2082,11 +2090,6 @@ ActiveRecord::Schema.define(version: 20180503150427) do ...@@ -2082,11 +2090,6 @@ ActiveRecord::Schema.define(version: 20180503150427) do
t.string "external_authorization_classification_label" t.string "external_authorization_classification_label"
t.string "external_webhook_token" t.string "external_webhook_token"
t.boolean "pages_https_only", default: true t.boolean "pages_https_only", default: true
t.string "import_status"
t.string "import_jid"
t.datetime_with_timezone "mirror_last_update_at"
t.datetime_with_timezone "mirror_last_successful_update_at"
t.text "import_error"
end end
add_index "projects", ["ci_id"], name: "index_projects_on_ci_id", using: :btree add_index "projects", ["ci_id"], name: "index_projects_on_ci_id", using: :btree
...@@ -2098,6 +2101,7 @@ ActiveRecord::Schema.define(version: 20180503150427) do ...@@ -2098,6 +2101,7 @@ ActiveRecord::Schema.define(version: 20180503150427) do
add_index "projects", ["last_activity_at"], name: "index_projects_on_last_activity_at", using: :btree add_index "projects", ["last_activity_at"], name: "index_projects_on_last_activity_at", using: :btree
add_index "projects", ["last_repository_check_failed"], name: "index_projects_on_last_repository_check_failed", using: :btree add_index "projects", ["last_repository_check_failed"], name: "index_projects_on_last_repository_check_failed", using: :btree
add_index "projects", ["last_repository_updated_at"], name: "index_projects_on_last_repository_updated_at", using: :btree add_index "projects", ["last_repository_updated_at"], name: "index_projects_on_last_repository_updated_at", using: :btree
add_index "projects", ["mirror_last_successful_update_at"], name: "index_projects_on_mirror_last_successful_update_at", using: :btree
add_index "projects", ["name"], name: "index_projects_on_name_trigram", using: :gin, opclasses: {"name"=>"gin_trgm_ops"} add_index "projects", ["name"], name: "index_projects_on_name_trigram", using: :gin, opclasses: {"name"=>"gin_trgm_ops"}
add_index "projects", ["namespace_id"], name: "index_projects_on_namespace_id", using: :btree add_index "projects", ["namespace_id"], name: "index_projects_on_namespace_id", using: :btree
add_index "projects", ["path"], name: "index_projects_on_path", using: :btree add_index "projects", ["path"], name: "index_projects_on_path", using: :btree
......
...@@ -16,6 +16,7 @@ module EE ...@@ -16,6 +16,7 @@ module EE
before_validation :mark_remote_mirrors_for_removal before_validation :mark_remote_mirrors_for_removal
before_save :set_override_pull_mirror_available, unless: -> { ::Gitlab::CurrentSettings.mirror_available } before_save :set_override_pull_mirror_available, unless: -> { ::Gitlab::CurrentSettings.mirror_available }
before_save :set_next_execution_timestamp_to_now, if: ->(project) { project.mirror? && project.mirror_changed? && project.import_state }
after_update :remove_mirror_repository_reference, after_update :remove_mirror_repository_reference,
if: ->(project) { project.mirror? && project.import_url_updated? } if: ->(project) { project.mirror? && project.import_url_updated? }
...@@ -134,39 +135,31 @@ module EE ...@@ -134,39 +135,31 @@ module EE
mirror? && !empty_repo? mirror? && !empty_repo?
end end
override :ensure_import_state def import_state_args
def ensure_import_state(param) super.merge(last_update_at: self[:mirror_last_update_at],
return unless self[param] && import_state.nil? last_successful_update_at: self[:mirror_last_successful_update_at])
create_import_state(status: self[:import_status],
jid: self[:import_jid],
last_error: self[:import_error],
last_update_at: self[:mirror_last_update_at],
last_successful_update_at: self[:mirror_last_successful_update_at])
update(import_status: nil)
end end
def mirror_last_update_at=(new_value) def mirror_last_update_at=(new_value)
return super unless import_state ensure_import_state
import_state.last_update_at = new_value import_state&.last_update_at = new_value
end end
def mirror_last_update_at def mirror_last_update_at
ensure_import_state(:mirror_last_update_at) ensure_import_state
import_state&.last_update_at import_state&.last_update_at
end end
def mirror_last_successful_update_at=(new_value) def mirror_last_successful_update_at=(new_value)
return super unless import_state ensure_import_state
import_state.last_successful_update_at = new_value import_state&.last_successful_update_at = new_value
end end
def mirror_last_successful_update_at def mirror_last_successful_update_at
ensure_import_state(:mirror_last_successful_update_at) ensure_import_state
import_state&.last_successful_update_at import_state&.last_successful_update_at
end end
...@@ -548,6 +541,10 @@ module EE ...@@ -548,6 +541,10 @@ module EE
true true
end end
def set_next_execution_timestamp_to_now
import_state.set_next_execution_to_now
end
def licensed_feature_available?(feature) def licensed_feature_available?(feature)
available_features = strong_memoize(:licensed_feature_available) do available_features = strong_memoize(:licensed_feature_available) do
Hash.new do |h, feature| Hash.new do |h, feature|
......
...@@ -89,7 +89,7 @@ module EE ...@@ -89,7 +89,7 @@ module EE
end end
def set_next_execution_to_now def set_next_execution_to_now
return unless mirror? return unless project.mirror?
self.next_execution_timestamp = Time.now self.next_execution_timestamp = Time.now
end end
......
---
title: Improves database performance of mirrors, forks and imports
merge_request: 5522
author:
type: performance
class MigrateMirrorAttributesDataFromProjectsToImportState < ActiveRecord::Migration
include Gitlab::Database::MigrationHelpers
DOWNTIME = false
disable_ddl_transaction!
class Project < ActiveRecord::Base
include EachBatch
self.table_name = 'projects'
scope :join_mirror_data, -> { joins('INNER JOIN project_mirror_data ON project_mirror_data.project_id = projects.id') }
end
def up
Project.join_mirror_data.each_batch do |batch|
start, stop = batch.pluck('MIN(projects.id), MAX(projects.id)').first
if Gitlab::Database.mysql?
execute <<~SQL
UPDATE project_mirror_data, projects
SET
project_mirror_data.status = projects.import_status,
project_mirror_data.jid = projects.import_jid,
project_mirror_data.last_update_at = projects.mirror_last_update_at,
project_mirror_data.last_successful_update_at = projects.mirror_last_successful_update_at,
project_mirror_data.last_error = projects.import_error
WHERE projects.id = project_mirror_data.project_id
AND projects.mirror = TRUE
AND projects.id BETWEEN #{start} AND #{stop}
SQL
else
execute <<~SQL
UPDATE project_mirror_data
SET
status = projects.import_status,
jid = projects.import_jid,
last_update_at = projects.mirror_last_update_at,
last_successful_update_at = projects.mirror_last_successful_update_at,
last_error = projects.import_error
FROM projects
WHERE projects.id = project_id
AND projects.mirror = TRUE
AND projects.id BETWEEN #{start} AND #{stop}
SQL
end
execute <<~SQL
UPDATE projects
SET import_status = 'none'
WHERE mirror = TRUE
AND id BETWEEN #{start} AND #{stop}
SQL
end
end
def down
Project.join_mirror_data.each_batch do |batch|
start, stop = batch.pluck('MIN(projects.id), MAX(projects.id)').first
if Gitlab::Database.mysql?
execute <<~SQL
UPDATE projects, project_mirror_data
SET
projects.import_status = project_mirror_data.status,
projects.import_jid = project_mirror_data.jid,
projects.mirror_last_update_at = project_mirror_data.last_update_at,
projects.mirror_last_successful_update_at = project_mirror_data.last_successful_update_at,
projects.import_error = project_mirror_data.last_error
WHERE project_mirror_data.project_id = projects.id
AND projects.mirror = TRUE
AND projects.id BETWEEN #{start} AND #{stop}
SQL
execute <<~SQL
UPDATE project_mirror_data, projects
SET project_mirror_data.status = 'none'
WHERE projects.id = project_mirror_data.project_id
AND projects.mirror = TRUE
AND projects.id BETWEEN #{start} AND #{stop}
SQL
else
execute <<~SQL
UPDATE projects
SET
import_status = project_mirror_data.status,
import_jid = project_mirror_data.jid,
mirror_last_update_at = project_mirror_data.last_update_at,
mirror_last_successful_update_at = project_mirror_data.last_successful_update_at,
import_error = project_mirror_data.last_error
FROM project_mirror_data
WHERE project_mirror_data.project_id = projects.id
AND projects.mirror = TRUE
AND projects.id BETWEEN #{start} AND #{stop}
SQL
execute <<~SQL
UPDATE project_mirror_data
SET status = 'none'
FROM projects
WHERE projects.id = project_id
AND projects.mirror = TRUE
AND projects.id BETWEEN #{start} AND #{stop}
SQL
end
end
end
end
require 'spec_helper'
require Rails.root.join('ee', 'db', 'post_migrate', '20180430180136_migrate_mirror_attributes_data_from_projects_to_import_state.rb')
describe MigrateMirrorAttributesDataFromProjectsToImportState, :migration do
let(:namespaces) { table(:namespaces) }
let(:projects) { table(:projects) }
let(:import_state) { table(:project_mirror_data) }
describe '#up' do
before do
namespaces.create(id: 1, name: 'gitlab-org', path: 'gitlab-org')
projects.create!(id: 1, namespace_id: 1, name: 'gitlab1',
path: 'gitlab1', import_error: "foo", import_status: :started,
mirror: true, import_url: generate(:url))
projects.create!(id: 2, namespace_id: 1, name: 'gitlab2',
path: 'gitlab2', import_error: "foo", import_status: :finished,
mirror: false, import_url: generate(:url))
import_state.create!(id: 1, project_id: 1)
import_state.create!(id: 2, project_id: 2)
end
it 'migrates the mirror data to the import_state table' do
expect(projects.joins("INNER JOIN project_mirror_data ON project_mirror_data.project_id = projects.id").count).to eq(2)
expect do
subject.up
end.to change { projects.where(import_status: 'none').count }.from(0).to(1)
expect(import_state.first.status).to eq("started")
expect(import_state.first.last_error).to eq("foo")
expect(import_state.last.status).to be_nil
expect(import_state.last.last_error).to be_nil
end
end
describe '#down' do
before do
namespaces.create(id: 1, name: 'gitlab-org', path: 'gitlab-org')
projects.create!(id: 1, namespace_id: 1, name: 'gitlab1',
path: 'gitlab1', mirror: true, import_url: generate(:url))
import_state.create!(id: 1, project_id: 1, status: :started, last_error: "foo")
end
it 'migrates the import_state mirror data into the projects table' do
expect(projects.joins("INNER JOIN project_mirror_data ON project_mirror_data.project_id = projects.id").count).to eq(1)
expect do
subject.down
end.to change { import_state.where(status: 'none').count }.from(0).to(1)
expect(projects.first.import_status).to eq("started")
expect(projects.first.import_error).to eq("foo")
end
end
end
...@@ -48,6 +48,52 @@ describe Project do ...@@ -48,6 +48,52 @@ describe Project do
end end
end end
describe 'setting up a mirror' do
context 'when new project' do
it 'creates import_state and sets next_execution_timestamp to now' do
project = build(:project, :mirror)
Timecop.freeze do
expect do
project.save
end.to change { ProjectImportState.count }.by(1)
expect(project.import_state.next_execution_timestamp).to eq(Time.now)
end
end
end
context 'when project already exists' do
context 'when project is not import' do
it 'creates import_state and sets next_execution_timestamp to now' do
project = create(:project)
Timecop.freeze do
expect do
project.update_attributes(mirror: true, mirror_user_id: project.creator.id, import_url: generate(:url))
end.to change { ProjectImportState.count }.by(1)
expect(project.import_state.next_execution_timestamp).to eq(Time.now)
end
end
end
context 'when project is import' do
it 'sets current import_state next_execution_timestamp to now' do
project = create(:project, import_url: generate(:url))
Timecop.freeze do
expect do
project.update_attributes(mirror: true, mirror_user_id: project.creator.id)
end.not_to change { ProjectImportState.count }
expect(project.import_state.next_execution_timestamp).to eq(Time.now)
end
end
end
end
end
describe '.mirrors_to_sync' do describe '.mirrors_to_sync' do
let(:timestamp) { Time.now } let(:timestamp) { Time.now }
......
# frozen_string_literal: true
module Gitlab
module BackgroundMigration
# This background migration creates all the records on the
# import state table for projects that are considered imports or forks
class PopulateImportState
def perform(start_id, end_id)
move_attributes_data_to_import_state(start_id, end_id)
rescue ActiveRecord::RecordNotUnique
retry
end
def move_attributes_data_to_import_state(start_id, end_id)
Rails.logger.info("#{self.class.name} - Moving import attributes data to project mirror data table: #{start_id} - #{end_id}")
ActiveRecord::Base.connection.execute <<~SQL
INSERT INTO project_mirror_data (project_id, status, jid, last_update_at, last_successful_update_at, last_error)
SELECT id, import_status, import_jid, mirror_last_update_at, mirror_last_successful_update_at, import_error
FROM projects
WHERE projects.import_status != 'none'
AND projects.id BETWEEN #{start_id} AND #{end_id}
AND NOT EXISTS (
SELECT id
FROM project_mirror_data
WHERE project_id = projects.id
)
SQL
ActiveRecord::Base.connection.execute <<~SQL
UPDATE projects
SET import_status = 'none'
WHERE import_status != 'none'
AND id BETWEEN #{start_id} AND #{end_id}
SQL
end
end
end
end
# frozen_string_literal: true
module Gitlab
module BackgroundMigration
# This background migration migrates all the data of import_state
# back to the projects table for projects that are considered imports or forks
class RollbackImportStateData
def perform(start_id, end_id)
move_attributes_data_to_project(start_id, end_id)
end
def move_attributes_data_to_project(start_id, end_id)
Rails.logger.info("#{self.class.name} - Moving import attributes data to projects table: #{start_id} - #{end_id}")
if Gitlab::Database.mysql?
ActiveRecord::Base.connection.execute <<~SQL
UPDATE projects, project_mirror_data
SET
projects.import_status = project_mirror_data.status,
projects.import_jid = project_mirror_data.jid,
projects.mirror_last_update_at = project_mirror_data.last_update_at,
projects.mirror_last_successful_update_at = project_mirror_data.last_successful_update_at,
projects.import_error = project_mirror_data.last_error
WHERE project_mirror_data.project_id = projects.id
AND project_mirror_data.id BETWEEN #{start_id} AND #{end_id}
SQL
else
ActiveRecord::Base.connection.execute <<~SQL
UPDATE projects
SET
import_status = project_mirror_data.status,
import_jid = project_mirror_data.jid,
mirror_last_update_at = project_mirror_data.last_update_at,
mirror_last_successful_update_at = project_mirror_data.last_successful_update_at,
import_error = project_mirror_data.last_error
FROM project_mirror_data
WHERE project_mirror_data.project_id = projects.id
AND project_mirror_data.id BETWEEN #{start_id} AND #{end_id}
SQL
end
end
end
end
end
...@@ -43,7 +43,8 @@ module Gitlab ...@@ -43,7 +43,8 @@ module Gitlab
Gitlab::SidekiqStatus Gitlab::SidekiqStatus
.set(jid, StuckImportJobsWorker::IMPORT_JOBS_EXPIRATION) .set(jid, StuckImportJobsWorker::IMPORT_JOBS_EXPIRATION)
project.update_column(:import_jid, jid) project.ensure_import_state
project.import_state&.update_column(:jid, jid)
Stage::ImportRepositoryWorker Stage::ImportRepositoryWorker
.perform_async(project.id) .perform_async(project.id)
......
...@@ -78,7 +78,9 @@ module Gitlab ...@@ -78,7 +78,9 @@ module Gitlab
def handle_errors def handle_errors
return unless errors.any? return unless errors.any?
project.update_column(:import_error, { project.ensure_import_state
project.import_state&.update_column(:last_error, {
message: 'The remote data could not be fully imported.', message: 'The remote data could not be fully imported.',
errors: errors errors: errors
}.to_json) }.to_json)
......
...@@ -74,7 +74,7 @@ FactoryBot.define do ...@@ -74,7 +74,7 @@ FactoryBot.define do
end end
before(:create) do |project, evaluator| before(:create) do |project, evaluator|
project.create_import_state(status: evaluator.status) project.create_import_state(:status, evaluator.status)
end end
end end
...@@ -128,7 +128,6 @@ FactoryBot.define do ...@@ -128,7 +128,6 @@ FactoryBot.define do
project.create_import_state(status: evaluator.status, project.create_import_state(status: evaluator.status,
last_update_at: evaluator.last_update_at) last_update_at: evaluator.last_update_at)
end end
end end
trait :import_hard_failed do trait :import_hard_failed do
......
require 'spec_helper'
describe Gitlab::BackgroundMigration::PopulateImportState, :migration, schema: 20180430144643 do
let(:migration) { described_class.new }
let(:namespaces) { table(:namespaces) }
let(:projects) { table(:projects) }
let(:import_state) { table(:project_mirror_data) }
before do
namespaces.create(id: 1, name: 'gitlab-org', path: 'gitlab-org')
projects.create!(id: 1, namespace_id: 1, name: 'gitlab1',
path: 'gitlab1', import_error: "foo", import_status: :started,
import_url: generate(:url))
projects.create!(id: 2, namespace_id: 1, name: 'gitlab2', path: 'gitlab2',
import_status: :none, import_url: generate(:url))
projects.create!(id: 3, namespace_id: 1, name: 'gitlab3',
path: 'gitlab3', import_error: "bar", import_status: :failed,
import_url: generate(:url))
allow(BackgroundMigrationWorker).to receive(:perform_in)
end
it "creates new import_state records with project's import data" do
expect(projects.where.not(import_status: :none).count).to eq(2)
expect do
migration.perform(1, 3)
end.to change { import_state.all.count }.from(0).to(2)
expect(import_state.first.last_error).to eq("foo")
expect(import_state.last.last_error).to eq("bar")
expect(import_state.first.status).to eq("started")
expect(import_state.last.status).to eq("failed")
expect(projects.first.import_status).to eq("none")
expect(projects.last.import_status).to eq("none")
end
end
require 'spec_helper'
describe Gitlab::BackgroundMigration::RollbackImportStateData, :migration, schema: 20180430144643 do
let(:migration) { described_class.new }
let(:namespaces) { table(:namespaces) }
let(:projects) { table(:projects) }
let(:import_state) { table(:project_mirror_data) }
before do
namespaces.create(id: 1, name: 'gitlab-org', path: 'gitlab-org')
projects.create!(id: 1, namespace_id: 1, name: 'gitlab1', import_url: generate(:url))
projects.create!(id: 2, namespace_id: 1, name: 'gitlab2', path: 'gitlab2', import_url: generate(:url))
import_state.create!(id: 1, project_id: 1, status: :started, last_error: "foo")
import_state.create!(id: 2, project_id: 2, status: :failed)
allow(BackgroundMigrationWorker).to receive(:perform_in)
end
it "creates new import_state records with project's import data" do
migration.perform(1, 2)
expect(projects.first.import_status).to eq("started")
expect(projects.second.import_status).to eq("failed")
expect(projects.first.import_error).to eq("foo")
end
end
...@@ -12,6 +12,8 @@ describe Gitlab::GithubImport::ParallelImporter do ...@@ -12,6 +12,8 @@ describe Gitlab::GithubImport::ParallelImporter do
let(:importer) { described_class.new(project) } let(:importer) { described_class.new(project) }
before do before do
create(:import_state, :started, project: project)
expect(Gitlab::GithubImport::Stage::ImportRepositoryWorker) expect(Gitlab::GithubImport::Stage::ImportRepositoryWorker)
.to receive(:perform_async) .to receive(:perform_async)
.with(project.id) .with(project.id)
...@@ -34,8 +36,6 @@ describe Gitlab::GithubImport::ParallelImporter do ...@@ -34,8 +36,6 @@ describe Gitlab::GithubImport::ParallelImporter do
it 'updates the import JID of the project' do it 'updates the import JID of the project' do
importer.execute importer.execute
debugger
expect(project.reload.import_jid).to eq("github-importer/#{project.id}") expect(project.reload.import_jid).to eq("github-importer/#{project.id}")
end end
end end
......
require 'spec_helper'
require Rails.root.join('db', 'post_migrate', '20180430144643_migrate_import_attributes_data_from_projects_to_project_mirror_data.rb')
describe MigrateImportAttributesDataFromProjectsToProjectMirrorData, :sidekiq, :migration do
let(:namespaces) { table(:namespaces) }
let(:projects) { table(:projects) }
let(:import_state) { table(:project_mirror_data) }
before do
stub_const("#{described_class}::BATCH_SIZE", 1)
namespaces.create(id: 1, name: 'gitlab-org', path: 'gitlab-org')
projects.create!(id: 1, namespace_id: 1, name: 'gitlab1',
path: 'gitlab1', import_error: "foo", import_status: :started,
import_url: generate(:url))
projects.create!(id: 2, namespace_id: 1, name: 'gitlab2',
path: 'gitlab2', import_error: "bar", import_status: :failed,
import_url: generate(:url))
projects.create!(id: 3, namespace_id: 1, name: 'gitlab3', path: 'gitlab3', import_status: :none, import_url: generate(:url))
end
it 'schedules delayed background migrations in batches in bulk' do
Sidekiq::Testing.fake! do
Timecop.freeze do
expect(projects.where.not(import_status: :none).count).to eq(2)
subject.up
expect(BackgroundMigrationWorker.jobs.size).to eq 2
expect(described_class::UP_MIGRATION).to be_scheduled_delayed_migration(5.minutes, 1, 1)
expect(described_class::UP_MIGRATION).to be_scheduled_delayed_migration(10.minutes, 2, 2)
end
end
end
describe '#down' do
before do
import_state.create!(id: 1, project_id: 1, status: :started)
import_state.create!(id: 2, project_id: 2, status: :started)
end
it 'schedules delayed background migrations in batches in bulk for rollback' do
Sidekiq::Testing.fake! do
Timecop.freeze do
expect(import_state.where.not(status: :none).count).to eq(2)
subject.down
expect(BackgroundMigrationWorker.jobs.size).to eq 2
expect(described_class::DOWN_MIGRATION).to be_scheduled_delayed_migration(5.minutes, 1, 1)
expect(described_class::DOWN_MIGRATION).to be_scheduled_delayed_migration(10.minutes, 2, 2)
end
end
end
end
end
...@@ -107,7 +107,7 @@ describe Gitlab::GithubImport::AdvanceStageWorker, :clean_gitlab_redis_shared_st ...@@ -107,7 +107,7 @@ describe Gitlab::GithubImport::AdvanceStageWorker, :clean_gitlab_redis_shared_st
# This test is there to make sure we only select the columns we care # This test is there to make sure we only select the columns we care
# about. # about.
# TODO: enable this assertion back again # TODO: enable this assertion back again
#expect(found.attributes).to include({ 'id' => nil, 'import_jid' => '123' }) # expect(found.attributes).to include({ 'id' => nil, 'import_jid' => '123' })
end end
it 'returns nil if the project import is not running' do it 'returns nil if the project import is not running' do
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment