2019-07-25 01:21:37 -04:00
# frozen_string_literal: true
2017-12-07 10:33:30 -05:00
require 'spec_helper'
2020-09-21 20:09:59 -04:00
RSpec . describe Backup :: Repositories do
2017-12-07 10:33:30 -05:00
let ( :progress ) { StringIO . new }
2019-12-12 07:07:33 -05:00
2018-05-24 10:58:25 -04:00
subject { described_class . new ( progress ) }
2017-12-07 10:33:30 -05:00
before do
allow ( progress ) . to receive ( :puts )
allow ( progress ) . to receive ( :print )
2019-11-20 01:06:16 -05:00
allow_next_instance_of ( described_class ) do | instance |
allow ( instance ) . to receive ( :progress ) . and_return ( progress )
end
2017-12-07 10:33:30 -05:00
end
2020-08-25 23:10:11 -04:00
describe '#dump' do
2020-09-24 08:09:37 -04:00
let_it_be ( :projects ) { create_list ( :project , 5 , :repository ) }
2020-08-12 20:10:06 -04:00
2020-09-24 08:09:37 -04:00
RSpec . shared_examples 'creates repository bundles' do
specify :aggregate_failures do
2020-10-06 11:08:33 -04:00
# Add data to the wiki, design repositories, and snippets, so they will be included in the dump.
2020-09-24 08:09:37 -04:00
create ( :wiki_page , container : project )
2020-10-02 05:08:33 -04:00
create ( :design , :with_file , issue : create ( :issue , project : project ) )
2020-10-06 11:08:33 -04:00
project_snippet = create ( :project_snippet , :repository , project : project )
personal_snippet = create ( :personal_snippet , :repository , author : project . owner )
2020-08-12 20:10:06 -04:00
2020-09-21 20:09:59 -04:00
subject . dump ( max_concurrency : 1 , max_storage_concurrency : 1 )
2020-09-24 08:09:37 -04:00
expect ( File ) . to exist ( File . join ( Gitlab . config . backup . path , 'repositories' , project . disk_path + '.bundle' ) )
expect ( File ) . to exist ( File . join ( Gitlab . config . backup . path , 'repositories' , project . disk_path + '.wiki' + '.bundle' ) )
2020-10-02 05:08:33 -04:00
expect ( File ) . to exist ( File . join ( Gitlab . config . backup . path , 'repositories' , project . disk_path + '.design' + '.bundle' ) )
2020-10-06 11:08:33 -04:00
expect ( File ) . to exist ( File . join ( Gitlab . config . backup . path , 'repositories' , personal_snippet . disk_path + '.bundle' ) )
expect ( File ) . to exist ( File . join ( Gitlab . config . backup . path , 'repositories' , project_snippet . disk_path + '.bundle' ) )
2020-09-21 20:09:59 -04:00
end
2020-09-24 08:09:37 -04:00
end
2020-09-21 20:09:59 -04:00
2020-09-24 08:09:37 -04:00
context 'hashed storage' do
let_it_be ( :project ) { create ( :project , :repository ) }
it_behaves_like 'creates repository bundles'
end
context 'legacy storage' do
let_it_be ( :project ) { create ( :project , :repository , :legacy_storage ) }
it_behaves_like 'creates repository bundles'
end
context 'no concurrency' do
2020-08-12 20:10:06 -04:00
it 'creates the expected number of threads' do
expect ( Thread ) . not_to receive ( :new )
projects . each do | project |
expect ( subject ) . to receive ( :dump_project ) . with ( project ) . and_call_original
end
subject . dump ( max_concurrency : 1 , max_storage_concurrency : 1 )
2017-12-07 10:33:30 -05:00
end
2020-08-12 20:10:06 -04:00
describe 'command failure' do
it 'dump_project raises an error' do
allow ( subject ) . to receive ( :dump_project ) . and_raise ( IOError )
expect { subject . dump ( max_concurrency : 1 , max_storage_concurrency : 1 ) } . to raise_error ( IOError )
end
it 'project query raises an error' do
2020-09-04 05:08:38 -04:00
allow ( Project ) . to receive_message_chain ( :includes , :find_each ) . and_raise ( ActiveRecord :: StatementTimeout )
2020-08-12 20:10:06 -04:00
expect { subject . dump ( max_concurrency : 1 , max_storage_concurrency : 1 ) } . to raise_error ( ActiveRecord :: StatementTimeout )
end
end
2020-09-04 05:08:38 -04:00
it 'avoids N+1 database queries' do
control_count = ActiveRecord :: QueryRecorder . new do
subject . dump ( max_concurrency : 1 , max_storage_concurrency : 1 )
end . count
2020-09-24 08:09:37 -04:00
create_list ( :project , 2 , :repository )
2020-09-04 05:08:38 -04:00
expect do
subject . dump ( max_concurrency : 1 , max_storage_concurrency : 1 )
end . not_to exceed_query_limit ( control_count )
end
2020-08-12 20:10:06 -04:00
end
[ 4 , 10 ] . each do | max_storage_concurrency |
2020-09-07 02:08:35 -04:00
context " max_storage_concurrency #{ max_storage_concurrency } " , quarantine : 'https://gitlab.com/gitlab-org/gitlab/-/issues/241701' do
2020-09-24 08:09:37 -04:00
let ( :storage_keys ) { %w[ default test_second_storage ] }
before do
allow ( Gitlab . config . repositories . storages ) . to receive ( :keys ) . and_return ( storage_keys )
end
2020-08-12 20:10:06 -04:00
it 'creates the expected number of threads' do
expect ( Thread ) . to receive ( :new )
. exactly ( storage_keys . length * ( max_storage_concurrency + 1 ) ) . times
. and_call_original
projects . each do | project |
expect ( subject ) . to receive ( :dump_project ) . with ( project ) . and_call_original
end
subject . dump ( max_concurrency : 1 , max_storage_concurrency : max_storage_concurrency )
end
it 'creates the expected number of threads with extra max concurrency' do
expect ( Thread ) . to receive ( :new )
. exactly ( storage_keys . length * ( max_storage_concurrency + 1 ) ) . times
. and_call_original
projects . each do | project |
expect ( subject ) . to receive ( :dump_project ) . with ( project ) . and_call_original
end
subject . dump ( max_concurrency : 3 , max_storage_concurrency : max_storage_concurrency )
end
describe 'command failure' do
it 'dump_project raises an error' do
allow ( subject ) . to receive ( :dump_project )
. and_raise ( IOError )
expect { subject . dump ( max_concurrency : 1 , max_storage_concurrency : max_storage_concurrency ) } . to raise_error ( IOError )
end
it 'project query raises an error' do
2020-09-04 05:08:38 -04:00
allow ( Project ) . to receive_message_chain ( :for_repository_storage , :includes , :find_each ) . and_raise ( ActiveRecord :: StatementTimeout )
2020-08-12 20:10:06 -04:00
expect { subject . dump ( max_concurrency : 1 , max_storage_concurrency : max_storage_concurrency ) } . to raise_error ( ActiveRecord :: StatementTimeout )
end
context 'misconfigured storages' do
let ( :storage_keys ) { %w[ test_second_storage ] }
it 'raises an error' do
expect { subject . dump ( max_concurrency : 1 , max_storage_concurrency : max_storage_concurrency ) } . to raise_error ( Backup :: Error , 'repositories.storages in gitlab.yml is misconfigured' )
end
end
end
2020-09-04 05:08:38 -04:00
it 'avoids N+1 database queries' do
control_count = ActiveRecord :: QueryRecorder . new do
subject . dump ( max_concurrency : 1 , max_storage_concurrency : max_storage_concurrency )
end . count
2020-09-24 08:09:37 -04:00
create_list ( :project , 2 , :repository )
2020-09-04 05:08:38 -04:00
expect do
subject . dump ( max_concurrency : 1 , max_storage_concurrency : max_storage_concurrency )
end . not_to exceed_query_limit ( control_count )
end
2017-12-07 10:33:30 -05:00
end
end
end
describe '#restore' do
2020-09-24 08:09:37 -04:00
let_it_be ( :project ) { create ( :project ) }
it 'restores repositories from bundles' , :aggregate_failures do
next_path_to_bundle = [
Rails . root . join ( 'spec/fixtures/lib/backup/project_repo.bundle' ) ,
2020-10-02 05:08:33 -04:00
Rails . root . join ( 'spec/fixtures/lib/backup/wiki_repo.bundle' ) ,
Rails . root . join ( 'spec/fixtures/lib/backup/design_repo.bundle' )
2020-09-24 08:09:37 -04:00
] . to_enum
allow_next_instance_of ( described_class :: BackupRestore ) do | backup_restore |
allow ( backup_restore ) . to receive ( :path_to_bundle ) . and_return ( next_path_to_bundle . next )
end
subject . restore
collect_commit_shas = - > ( repo ) { repo . commits ( 'master' , limit : 10 ) . map ( & :sha ) }
expect ( collect_commit_shas . call ( project . repository ) ) . to eq ( [ '393a7d860a5a4c3cc736d7eb00604e3472bb95ec' ] )
expect ( collect_commit_shas . call ( project . wiki . repository ) ) . to eq ( [ 'c74b9948d0088d703ee1fafeddd9ed9add2901ea' ] )
2020-10-02 05:08:33 -04:00
expect ( collect_commit_shas . call ( project . design_repository ) ) . to eq ( [ 'c3cd4d7bd73a51a0f22045c3a4c871c435dc959d' ] )
2020-09-24 08:09:37 -04:00
end
2018-03-02 13:14:19 -05:00
2017-12-07 10:33:30 -05:00
describe 'command failure' do
before do
2020-03-16 08:09:12 -04:00
expect ( Project ) . to receive ( :find_each ) . and_yield ( project )
2020-09-21 20:09:59 -04:00
2020-10-02 05:08:33 -04:00
allow_next_instance_of ( DesignManagement :: Repository ) do | repository |
allow ( repository ) . to receive ( :create_repository ) { raise 'Fail in tests' }
end
2020-09-21 20:09:59 -04:00
allow_next_instance_of ( Repository ) do | repository |
allow ( repository ) . to receive ( :create_repository ) { raise 'Fail in tests' }
end
2017-12-07 10:33:30 -05:00
end
2017-12-01 08:58:49 -05:00
context 'hashed storage' do
it 'shows the appropriate error' do
2018-03-02 13:14:19 -05:00
subject . restore
2017-12-07 10:33:30 -05:00
2020-09-21 20:09:59 -04:00
expect ( progress ) . to have_received ( :puts ) . with ( " [Failed] restoring #{ project . full_path } ( #{ project . disk_path } ) " )
2017-12-01 08:58:49 -05:00
end
end
context 'legacy storage' do
2020-09-21 20:09:59 -04:00
let_it_be ( :project ) { create ( :project , :legacy_storage ) }
2017-12-01 08:58:49 -05:00
it 'shows the appropriate error' do
2018-03-02 13:14:19 -05:00
subject . restore
2017-12-01 08:58:49 -05:00
2020-09-21 20:09:59 -04:00
expect ( progress ) . to have_received ( :puts ) . with ( " [Failed] restoring #{ project . full_path } ( #{ project . disk_path } ) " )
2017-12-01 08:58:49 -05:00
end
2017-12-07 10:33:30 -05:00
end
end
2018-12-10 03:31:28 -05:00
context 'restoring object pools' do
2019-10-23 05:06:03 -04:00
it 'schedules restoring of the pool' , :sidekiq_might_not_need_inline do
2018-12-10 03:31:28 -05:00
pool_repository = create ( :pool_repository , :failed )
pool_repository . delete_object_pool
subject . restore
pool_repository . reload
expect ( pool_repository ) . not_to be_failed
expect ( pool_repository . object_pool . exists? ) . to be ( true )
end
end
2020-02-12 19:08:46 -05:00
it 'cleans existing repositories' do
2020-10-02 05:08:33 -04:00
expect_next_instance_of ( DesignManagement :: Repository ) do | repository |
expect ( repository ) . to receive ( :remove )
end
2020-09-21 20:09:59 -04:00
expect ( Repository ) . to receive ( :new ) . twice . and_wrap_original do | method , * original_args |
repository = method . call ( * original_args )
2020-02-12 19:08:46 -05:00
2020-09-21 20:09:59 -04:00
expect ( repository ) . to receive ( :remove )
2020-02-12 19:08:46 -05:00
2020-09-21 20:09:59 -04:00
repository
2020-02-12 19:08:46 -05:00
end
subject . restore
2017-12-07 10:33:30 -05:00
end
end
end