debian-mirror-gitlab/spec/lib/backup/repositories_spec.rb

264 lines
9.6 KiB
Ruby
Raw Normal View History

2021-01-03 14:25:43 +05:30
# frozen_string_literal: true
require 'spec_helper'
RSpec.describe Backup::Repositories do
2021-09-04 01:27:46 +05:30
# Collaborators are spies so examples can assert on the messages they received.
let(:progress) { spy(:stdout) }
let(:parallel_enqueue) { true }
let(:strategy) { spy(:strategy, parallel_enqueue?: parallel_enqueue) }

# Concurrency settings; nested contexts override these where needed.
let(:max_concurrency) { 1 }
let(:max_storage_concurrency) { 1 }

# Destination argument handed to #dump / #restore by the examples.
let(:destination) { 'repositories' }

# Instance under test, assembled from the overridable settings above.
subject do
  concurrency_options = {
    max_concurrency: max_concurrency,
    max_storage_concurrency: max_storage_concurrency
  }

  described_class.new(progress, strategy: strategy, **concurrency_options)
end
2021-01-03 14:25:43 +05:30
describe '#dump' do
# Five projects with repositories, iterated over by the concurrency examples.
let_it_be(:projects) { create_list(:project, 5, :repository) }

# Shared examples for #dump; the including context must define `project`.
RSpec.shared_examples 'creates repository bundles' do
  it 'calls enqueue for each repository type', :aggregate_failures do
    snippet_in_project = create(:project_snippet, :repository, project: project)
    snippet_of_owner = create(:personal_snippet, :repository, author: project.first_owner)

    subject.dump(destination)

    expect(strategy).to have_received(:start).with(:create, destination)

    # The project itself is enqueued once per project-level repository type.
    [
      Gitlab::GlRepository::PROJECT,
      Gitlab::GlRepository::WIKI,
      Gitlab::GlRepository::DESIGN
    ].each do |repo_type|
      expect(strategy).to have_received(:enqueue).with(project, repo_type)
    end

    # Both kinds of snippet are enqueued with the SNIPPET repository type.
    [snippet_in_project, snippet_of_owner].each do |snippet|
      expect(strategy).to have_received(:enqueue).with(snippet, Gitlab::GlRepository::SNIPPET)
    end

    expect(strategy).to have_received(:finish!)
  end
end
# Runs the shared bundle examples once per storage flavour; each entry maps
# the context description to the extra factory traits used for `project`.
{
  'hashed storage' => [],
  'legacy storage' => [:legacy_storage]
}.each do |storage_description, extra_traits|
  context storage_description do
    let_it_be(:project) { create(:project, :repository, *extra_traits) }

    it_behaves_like 'creates repository bundles'
  end
end
# Examples that run #dump with the outer concurrency settings left untouched.
context 'no concurrency' do
  it 'creates the expected number of threads' do
    # No thread may be spawned in this configuration.
    expect(Thread).not_to receive(:new)

    expect(strategy).to receive(:start).with(:create, destination)
    projects.each do |repo_project|
      expect(strategy).to receive(:enqueue).with(repo_project, Gitlab::GlRepository::PROJECT)
    end
    expect(strategy).to receive(:finish!)

    subject.dump(destination)
  end

  describe 'command failure' do
    it 'enqueue_project raises an error' do
      allow(strategy)
        .to receive(:enqueue)
        .with(anything, Gitlab::GlRepository::PROJECT)
        .and_raise(IOError)

      expect { subject.dump(destination) }.to raise_error(IOError)
    end

    it 'project query raises an error' do
      allow(Project)
        .to receive_message_chain(:includes, :find_each)
        .and_raise(ActiveRecord::StatementTimeout)

      expect { subject.dump(destination) }.to raise_error(ActiveRecord::StatementTimeout)
    end
  end

  it 'avoids N+1 database queries' do
    # Query count of a first dump serves as the limit for the second one.
    baseline = ActiveRecord::QueryRecorder.new { subject.dump(destination) }.count

    create_list(:project, 2, :repository)

    expect { subject.dump(destination) }.not_to exceed_query_limit(baseline)
  end
end
2021-09-30 23:02:18 +05:30
# Concurrency is requested, but the strategy reports parallel_enqueue? as false.
context 'concurrency with a strategy without parallel enqueueing support' do
  let(:parallel_enqueue) { false }
  let(:max_concurrency) { 2 }
  let(:max_storage_concurrency) { 2 }

  it 'enqueues all projects sequentially' do
    # Despite the concurrency settings above, no thread may be created.
    expect(Thread).not_to receive(:new)

    expect(strategy).to receive(:start).with(:create, destination)
    projects.each do |repo_project|
      expect(strategy).to receive(:enqueue).with(repo_project, Gitlab::GlRepository::PROJECT)
    end
    expect(strategy).to receive(:finish!)

    subject.dump(destination)
  end
end
2021-01-03 14:25:43 +05:30
# Repeats the multi-storage examples for each per-storage concurrency level.
[4, 10].each do |storage_concurrency|
  context "max_storage_concurrency #{storage_concurrency}", quarantine: 'https://gitlab.com/gitlab-org/gitlab/-/issues/241701' do
    let(:storage_keys) { %w[default test_second_storage] }
    let(:max_storage_concurrency) { storage_concurrency }

    before do
      # Make the configured storages report exactly the keys under test.
      allow(Gitlab.config.repositories.storages).to receive(:keys).and_return(storage_keys)
    end

    it 'creates the expected number of threads' do
      thread_count = storage_keys.length * (max_storage_concurrency + 1)
      expect(Thread).to receive(:new).exactly(thread_count).times.and_call_original

      expect(strategy).to receive(:start).with(:create, destination)
      projects.each do |repo_project|
        expect(strategy).to receive(:enqueue).with(repo_project, Gitlab::GlRepository::PROJECT)
      end
      expect(strategy).to receive(:finish!)

      subject.dump(destination)
    end

    context 'with extra max concurrency' do
      let(:max_concurrency) { 3 }

      it 'creates the expected number of threads' do
        # The expected count is the same formula as without extra max_concurrency.
        thread_count = storage_keys.length * (max_storage_concurrency + 1)
        expect(Thread).to receive(:new).exactly(thread_count).times.and_call_original

        expect(strategy).to receive(:start).with(:create, destination)
        projects.each do |repo_project|
          expect(strategy).to receive(:enqueue).with(repo_project, Gitlab::GlRepository::PROJECT)
        end
        expect(strategy).to receive(:finish!)

        subject.dump(destination)
      end
    end

    describe 'command failure' do
      it 'enqueue_project raises an error' do
        allow(strategy).to receive(:enqueue).and_raise(IOError)

        expect { subject.dump(destination) }.to raise_error(IOError)
      end

      it 'project query raises an error' do
        allow(Project)
          .to receive_message_chain(:for_repository_storage, :includes, :find_each)
          .and_raise(ActiveRecord::StatementTimeout)

        expect { subject.dump(destination) }.to raise_error(ActiveRecord::StatementTimeout)
      end

      context 'misconfigured storages' do
        let(:storage_keys) { %w[test_second_storage] }

        it 'raises an error' do
          expect { subject.dump(destination) }
            .to raise_error(Backup::Error, 'repositories.storages in gitlab.yml is misconfigured')
        end
      end
    end

    it 'avoids N+1 database queries' do
      # Query count of a first dump serves as the limit for the second one.
      baseline = ActiveRecord::QueryRecorder.new { subject.dump(destination) }.count

      create_list(:project, 2, :repository)

      expect { subject.dump(destination) }.not_to exceed_query_limit(baseline)
    end
  end
end
end
describe '#restore' do
# Records shared by the #restore examples; the snippets belong to the
# project's first owner.
let_it_be(:project) { create(:project) }
let_it_be(:personal_snippet) { create(:personal_snippet, author: project.first_owner) }
let_it_be(:project_snippet) { create(:project_snippet, project: project, author: project.first_owner) }

it 'calls enqueue for each repository type', :aggregate_failures do
  subject.restore(destination)

  expect(strategy).to have_received(:start).with(:restore, destination)

  # The project itself is enqueued once per project-level repository type.
  [
    Gitlab::GlRepository::PROJECT,
    Gitlab::GlRepository::WIKI,
    Gitlab::GlRepository::DESIGN
  ].each do |repo_type|
    expect(strategy).to have_received(:enqueue).with(project, repo_type)
  end

  # Both kinds of snippet are enqueued with the SNIPPET repository type.
  [project_snippet, personal_snippet].each do |snippet|
    expect(strategy).to have_received(:enqueue).with(snippet, Gitlab::GlRepository::SNIPPET)
  end

  expect(strategy).to have_received(:finish!)
end
# Examples covering how #restore treats pool repositories.
context 'restoring object pools' do
  it 'schedules restoring of the pool', :sidekiq_might_not_need_inline do
    # Start from a failed pool whose object pool has been deleted.
    pool_repository = create(:pool_repository, :failed)
    pool_repository.delete_object_pool

    subject.restore(destination)

    pool_repository.reload
    expect(pool_repository).not_to be_failed
    expect(pool_repository.object_pool.exists?).to be(true)
  end

  # The tag is passed as example metadata (a separate argument) rather than
  # being embedded in the description string, where RSpec would ignore it.
  it 'skips pools with no source project', :sidekiq_might_not_need_inline do
    pool_repository = create(:pool_repository, state: :obsolete)
    # update_column writes the nil source project straight to the row.
    pool_repository.update_column(:source_project_id, nil)

    subject.restore(destination)

    pool_repository.reload
    expect(pool_repository).to be_obsolete
  end
end
2021-09-04 01:27:46 +05:30
# Examples for #restore when snippet repository validation reports an error.
context 'cleanup snippets' do
  before do
    [personal_snippet, project_snippet].each do |snippet|
      create(:snippet_repository, snippet: snippet)
    end

    # Stub the validation service so that it always returns an error response.
    failed_validation = ServiceResponse.error(message: "Repository has more than one branch")
    allow(Snippets::RepositoryValidationService)
      .to receive_message_chain(:new, :execute)
      .and_return(failed_validation)
  end

  it 'shows the appropriate error' do
    subject.restore(destination)

    [personal_snippet, project_snippet].each do |snippet|
      expect(progress)
        .to have_received(:puts)
        .with("Snippet #{snippet.full_path} can't be restored: Repository has more than one branch")
    end
  end

  it 'removes the snippets from the DB' do
    expect { subject.restore(destination) }
      .to change(PersonalSnippet, :count).by(-1)
      .and change(ProjectSnippet, :count).by(-1)
      .and change(SnippetRepository, :count).by(-2)
  end

  it 'removes the repository from disk' do
    # Capture the repository location before the restore runs.
    shell = Gitlab::Shell.new
    shard = personal_snippet.repository.shard
    repository_path = "#{personal_snippet.disk_path}.git"

    subject.restore(destination)

    expect(shell.repository_exists?(shard, repository_path)).to be(false)
  end
end
end
end