Commit 4fcec8a4 authored by Andreas Brandl's avatar Andreas Brandl

Random index selection strategy

This adds a random selection strategy to rebuild indexes. We tackle 2
indexes at a time and select rather large ones randomly. This is subject
to improvement later but it'll get us going (basically removing the need
to specify an index name manually).

Also, as suggested earlier, this adds a view to conveniently access
information about indexes and introduces a corresponding ActiveRecord
model.
parent 8a084bf2
---
title: 'Add database view for postgres indexes'
merge_request: 42967
author:
type: other
# frozen_string_literal: true
class AddPostgresIndexView < ActiveRecord::Migration[6.0]
DOWNTIME = false
def up
execute(<<~SQL)
CREATE VIEW postgres_indexes AS
SELECT
pg_namespace.nspname || '.' || pg_class.relname as identifier,
pg_index.indexrelid,
pg_namespace.nspname as schema,
pg_class.relname as name,
pg_index.indisunique as unique,
pg_index.indisvalid as valid_index,
pg_class.relispartition as partitioned,
pg_indexes.indexdef as definition,
pg_relation_size(pg_class.oid) as ondisk_size_bytes
FROM pg_index
INNER JOIN pg_class ON pg_class.oid = pg_index.indexrelid
INNER JOIN pg_namespace ON pg_class.relnamespace = pg_namespace.oid
INNER JOIN pg_indexes ON pg_class.relname = pg_indexes.indexname
WHERE pg_namespace.nspname <> 'pg_catalog'
SQL
end
def down
execute(<<~SQL)
DROP VIEW postgres_indexes
SQL
end
end
705d010620b1aa95e86c8fb5fb9175fe77778376d228003e9fd2c8d0bb20a347
\ No newline at end of file
...@@ -14411,6 +14411,22 @@ CREATE SEQUENCE pool_repositories_id_seq ...@@ -14411,6 +14411,22 @@ CREATE SEQUENCE pool_repositories_id_seq
ALTER SEQUENCE pool_repositories_id_seq OWNED BY pool_repositories.id; ALTER SEQUENCE pool_repositories_id_seq OWNED BY pool_repositories.id;
CREATE VIEW postgres_indexes AS
SELECT (((pg_namespace.nspname)::text || '.'::text) || (pg_class.relname)::text) AS identifier,
pg_index.indexrelid,
pg_namespace.nspname AS schema,
pg_class.relname AS name,
pg_index.indisunique AS "unique",
pg_index.indisvalid AS valid_index,
pg_class.relispartition AS partitioned,
pg_indexes.indexdef AS definition,
pg_relation_size((pg_class.oid)::regclass) AS ondisk_size_bytes
FROM (((pg_index
JOIN pg_class ON ((pg_class.oid = pg_index.indexrelid)))
JOIN pg_namespace ON ((pg_class.relnamespace = pg_namespace.oid)))
JOIN pg_indexes ON ((pg_class.relname = pg_indexes.indexname)))
WHERE (pg_namespace.nspname <> 'pg_catalog'::name);
CREATE TABLE programming_languages ( CREATE TABLE programming_languages (
id integer NOT NULL, id integer NOT NULL,
name character varying NOT NULL, name character varying NOT NULL,
......
# frozen_string_literal: true
module Gitlab
module Database
class PostgresIndex < ActiveRecord::Base
self.table_name = 'postgres_indexes'
self.primary_key = 'identifier'
scope :by_identifier, ->(identifier) do
raise ArgumentError, "Index name is not fully qualified with a schema: #{identifier}" unless identifier =~ /^\w+\.\w+$/
find(identifier)
end
scope :non_unique, -> { where(unique: false) }
scope :non_partitioned, -> { where(partitioned: false) }
scope :random_few, ->(how_many) do
limit(how_many).order(Arel.sql('RANDOM()'))
end
def to_s
name
end
end
end
end
# frozen_string_literal: true
module Gitlab
module Database
module Reindexing
def self.perform(index_selector)
Array.wrap(index_selector).each do |index|
ConcurrentReindex.new(index).perform
end
end
end
end
end
...@@ -22,6 +22,9 @@ module Gitlab ...@@ -22,6 +22,9 @@ module Gitlab
def perform def perform
raise ReindexError, 'UNIQUE indexes are currently not supported' if index.unique? raise ReindexError, 'UNIQUE indexes are currently not supported' if index.unique?
raise ReindexError, 'partitioned indexes are currently not supported' if index.partitioned?
logger.info "Starting reindex of #{index}"
with_rebuilt_index do |replacement_index| with_rebuilt_index do |replacement_index|
swap_index(replacement_index) swap_index(replacement_index)
...@@ -31,12 +34,13 @@ module Gitlab ...@@ -31,12 +34,13 @@ module Gitlab
private private
def with_rebuilt_index def with_rebuilt_index
if Gitlab::Database::PostgresIndex.find_by(schema: index.schema, name: replacement_index_name)
logger.debug("dropping dangling index from previous run (if it exists): #{replacement_index_name}") logger.debug("dropping dangling index from previous run (if it exists): #{replacement_index_name}")
remove_replacement_index remove_index(index.schema, replacement_index_name)
end
create_replacement_index_statement = index.definition create_replacement_index_statement = index.definition
.sub(/CREATE INDEX/, 'CREATE INDEX CONCURRENTLY') .sub(/CREATE INDEX #{index.name}/, "CREATE INDEX CONCURRENTLY #{replacement_index_name}")
.sub(/#{index.name}/, replacement_index_name)
logger.info("creating replacement index #{replacement_index_name}") logger.info("creating replacement index #{replacement_index_name}")
logger.debug("replacement index definition: #{create_replacement_index_statement}") logger.debug("replacement index definition: #{create_replacement_index_statement}")
...@@ -45,55 +49,57 @@ module Gitlab ...@@ -45,55 +49,57 @@ module Gitlab
connection.execute(create_replacement_index_statement) connection.execute(create_replacement_index_statement)
end end
replacement_index = Index.find_with_schema("#{index.schema}.#{replacement_index_name}") replacement_index = Gitlab::Database::PostgresIndex.find_by(schema: index.schema, name: replacement_index_name)
unless replacement_index.valid? unless replacement_index.valid_index?
message = 'replacement index was created as INVALID' message = 'replacement index was created as INVALID'
logger.error("#{message}, cleaning up") logger.error("#{message}, cleaning up")
raise ReindexError, "failed to reindex #{index}: #{message}" raise ReindexError, "failed to reindex #{index}: #{message}"
end end
yield replacement_index yield replacement_index
rescue Gitlab::Database::WithLockRetries::AttemptsExhaustedError => e
logger.error('failed to obtain the required database locks to swap the indexes, cleaning up')
raise ReindexError, e.message
rescue ActiveRecord::ActiveRecordError, PG::Error => e
logger.error("database error while attempting reindex of #{index}: #{e.message}")
raise ReindexError, e.message
ensure ensure
logger.info("dropping unneeded replacement index: #{replacement_index_name}") begin
remove_replacement_index remove_index(index.schema, replacement_index_name)
rescue => e
logger.error(e)
end
end end
def swap_index(replacement_index) def swap_index(replacement_index)
replaced_index_name = constrained_index_name(REPLACED_INDEX_PREFIX)
logger.info("swapping replacement index #{replacement_index} with #{index}") logger.info("swapping replacement index #{replacement_index} with #{index}")
with_lock_retries do with_lock_retries do
rename_index(index.name, replaced_index_name) rename_index(index.schema, index.name, replaced_index_name)
rename_index(replacement_index.name, index.name) rename_index(replacement_index.schema, replacement_index.name, index.name)
rename_index(replaced_index_name, replacement_index.name) rename_index(index.schema, replaced_index_name, replacement_index.name)
end end
end end
def rename_index(old_index_name, new_index_name) def rename_index(schema, old_index_name, new_index_name)
connection.execute("ALTER INDEX #{old_index_name} RENAME TO #{new_index_name}") connection.execute(<<~SQL)
ALTER INDEX #{quote_table_name(schema)}.#{quote_table_name(old_index_name)}
RENAME TO #{quote_table_name(new_index_name)}
SQL
end end
def remove_replacement_index def remove_index(schema, name)
logger.info("Removing index #{schema}.#{name}")
disable_statement_timeout do disable_statement_timeout do
connection.execute("DROP INDEX CONCURRENTLY IF EXISTS #{replacement_index_name}") connection.execute(<<~SQL)
DROP INDEX CONCURRENTLY
IF EXISTS #{quote_table_name(schema)}.#{quote_table_name(name)}
SQL
end end
end end
def replacement_index_name def replacement_index_name
@replacement_index_name ||= constrained_index_name(TEMPORARY_INDEX_PREFIX) @replacement_index_name ||= "#{TEMPORARY_INDEX_PREFIX}#{index.indexrelid}"
end end
def constrained_index_name(prefix) def replaced_index_name
"#{prefix}#{index.name}".slice(0, PG_IDENTIFIER_LENGTH) @replaced_index_name ||= "#{REPLACED_INDEX_PREFIX}#{index.indexrelid}"
end end
def with_lock_retries(&block) def with_lock_retries(&block)
...@@ -102,7 +108,7 @@ module Gitlab ...@@ -102,7 +108,7 @@ module Gitlab
Gitlab::Database::WithLockRetries.new(**arguments).run(raise_on_exhaustion: true, &block) Gitlab::Database::WithLockRetries.new(**arguments).run(raise_on_exhaustion: true, &block)
end end
delegate :execute, to: :connection delegate :execute, :quote_table_name, to: :connection
def connection def connection
@connection ||= ActiveRecord::Base.connection @connection ||= ActiveRecord::Base.connection
end end
......
# frozen_string_literal: true
module Gitlab
module Database
module Reindexing
class Index
def self.find_with_schema(full_name)
raise ArgumentError, "Index name is not fully qualified with a schema: #{full_name}" unless full_name =~ /^\w+\.\w+$/
schema, index = full_name.split('.')
record = ActiveRecord::Base.connection.select_one(<<~SQL)
SELECT
pg_index.indisunique as is_unique,
pg_index.indisvalid as is_valid,
pg_indexes.indexdef as definition,
pg_namespace.nspname as schema,
pg_class.relname as name
FROM pg_index
INNER JOIN pg_class ON pg_class.oid = pg_index.indexrelid
INNER JOIN pg_namespace ON pg_class.relnamespace = pg_namespace.oid
INNER JOIN pg_indexes ON pg_class.relname = pg_indexes.indexname
WHERE pg_namespace.nspname = #{ActiveRecord::Base.connection.quote(schema)}
AND pg_class.relname = #{ActiveRecord::Base.connection.quote(index)}
SQL
return unless record
new(OpenStruct.new(record))
end
delegate :definition, :schema, :name, to: :@attrs
def initialize(attrs)
@attrs = attrs
end
def unique?
@attrs.is_unique
end
def valid?
@attrs.is_valid
end
def to_s
name
end
end
end
end
end
...@@ -174,14 +174,16 @@ namespace :gitlab do ...@@ -174,14 +174,16 @@ namespace :gitlab do
exit exit
end end
raise ArgumentError, 'must give the index name to reindex' unless args[:index_name] indexes = if args[:index_name]
Gitlab::Database::PostgresIndex.by_identifier(args[:index_name])
index = Gitlab::Database::Reindexing::Index.find_with_schema(args[:index_name]) else
Gitlab::Database::PostgresIndex.non_unique.non_partitioned.random_few(2)
raise ArgumentError, "Given index does not exist: #{args[:index_name]}" unless index end
puts "Rebuilding index #{index}".color(:green) Gitlab::Database::Reindexing.perform(indexes)
Gitlab::Database::Reindexing::ConcurrentReindex.new(index).perform rescue => e
Gitlab::AppLogger.error(e)
raise
end end
end end
end end
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
require 'spec_helper' require 'spec_helper'
RSpec.describe Gitlab::Database::Reindexing::Index do RSpec.describe Gitlab::Database::PostgresIndex do
before do before do
ActiveRecord::Base.connection.execute(<<~SQL) ActiveRecord::Base.connection.execute(<<~SQL)
CREATE INDEX foo_idx ON public.users (name); CREATE INDEX foo_idx ON public.users (name);
...@@ -13,16 +13,16 @@ RSpec.describe Gitlab::Database::Reindexing::Index do ...@@ -13,16 +13,16 @@ RSpec.describe Gitlab::Database::Reindexing::Index do
end end
def find(name) def find(name)
described_class.find_with_schema(name) described_class.by_identifier(name)
end end
describe '.find_with_schema' do describe '.by_identifier' do
it 'returns an instance of Gitlab::Database::Reindexing::Index when the index is present' do it 'finds the index' do
expect(find('public.foo_idx')).to be_a(Gitlab::Database::Reindexing::Index) expect(find('public.foo_idx')).to be_a(Gitlab::Database::PostgresIndex)
end end
it 'returns nil if the index is not present' do it 'raises an error if not found' do
expect(find('public.idontexist')).to be_nil expect { find('public.idontexist') }.to raise_error(ActiveRecord::RecordNotFound)
end end
it 'raises ArgumentError if given a non-fully qualified index name' do it 'raises ArgumentError if given a non-fully qualified index name' do
...@@ -30,6 +30,24 @@ RSpec.describe Gitlab::Database::Reindexing::Index do ...@@ -30,6 +30,24 @@ RSpec.describe Gitlab::Database::Reindexing::Index do
end end
end end
describe '#non_unique' do
it 'only non-unique indexes' do
expect(described_class.non_unique).to all(have_attributes(unique: false))
end
end
describe '#non_partitioned' do
it 'only non partitioned indexes ' do
expect(described_class.non_partitioned).to all(have_attributes(partitioned: false))
end
end
describe '#random_few' do
it 'limits to two records by default' do
expect(described_class.random_few(2).size).to eq(2)
end
end
describe '#unique?' do describe '#unique?' do
it 'returns true for a unique index' do it 'returns true for a unique index' do
expect(find('public.bar_key')).to be_unique expect(find('public.bar_key')).to be_unique
...@@ -44,9 +62,9 @@ RSpec.describe Gitlab::Database::Reindexing::Index do ...@@ -44,9 +62,9 @@ RSpec.describe Gitlab::Database::Reindexing::Index do
end end
end end
describe '#valid?' do describe '#valid_index?' do
it 'returns true if the index is valid' do it 'returns true if the index is invalid' do
expect(find('public.foo_idx')).to be_valid expect(find('public.foo_idx')).to be_valid_index
end end
it 'returns false if the index is marked as invalid' do it 'returns false if the index is marked as invalid' do
...@@ -56,7 +74,7 @@ RSpec.describe Gitlab::Database::Reindexing::Index do ...@@ -56,7 +74,7 @@ RSpec.describe Gitlab::Database::Reindexing::Index do
WHERE pg_class.relname = 'foo_idx' AND pg_index.indexrelid = pg_class.oid WHERE pg_class.relname = 'foo_idx' AND pg_index.indexrelid = pg_class.oid
SQL SQL
expect(find('public.foo_idx')).not_to be_valid expect(find('public.foo_idx')).not_to be_valid_index
end end
end end
......
...@@ -8,7 +8,7 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -8,7 +8,7 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
let(:table_name) { '_test_reindex_table' } let(:table_name) { '_test_reindex_table' }
let(:column_name) { '_test_column' } let(:column_name) { '_test_column' }
let(:index_name) { '_test_reindex_index' } let(:index_name) { '_test_reindex_index' }
let(:index) { double('index', name: index_name, schema: 'public', unique?: false, definition: 'CREATE INDEX _test_reindex_index ON public._test_reindex_table USING btree (_test_column)') } let(:index) { instance_double(Gitlab::Database::PostgresIndex, indexrelid: 42, name: index_name, schema: 'public', partitioned?: false, unique?: false, definition: 'CREATE INDEX _test_reindex_index ON public._test_reindex_table USING btree (_test_column)') }
let(:logger) { double('logger', debug: nil, info: nil, error: nil ) } let(:logger) { double('logger', debug: nil, info: nil, error: nil ) }
let(:connection) { ActiveRecord::Base.connection } let(:connection) { ActiveRecord::Base.connection }
...@@ -23,7 +23,9 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -23,7 +23,9 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
end end
context 'when the index is unique' do context 'when the index is unique' do
let(:index) { double('index', name: index_name, unique?: true, definition: 'CREATE INDEX _test_reindex_index ON public._test_reindex_table USING btree (_test_column)') } before do
allow(index).to receive(:unique?).and_return(true)
end
it 'raises an error' do it 'raises an error' do
expect do expect do
...@@ -32,12 +34,29 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -32,12 +34,29 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
end end
end end
context 'when the index is partitioned' do
before do
allow(index).to receive(:partitioned?).and_return(true)
end
it 'raises an error' do
expect do
subject.perform
end.to raise_error(described_class::ReindexError, /partitioned indexes are currently not supported/)
end
end
context 'replacing the original index with a rebuilt copy' do context 'replacing the original index with a rebuilt copy' do
let(:replacement_name) { 'tmp_reindex__test_reindex_index' } let(:replacement_name) { 'tmp_reindex_42' }
let(:replaced_name) { 'old_reindex__test_reindex_index' } let(:replaced_name) { 'old_reindex_42' }
let(:create_index) { "CREATE INDEX CONCURRENTLY #{replacement_name} ON public.#{table_name} USING btree (#{column_name})" } let(:create_index) { "CREATE INDEX CONCURRENTLY #{replacement_name} ON public.#{table_name} USING btree (#{column_name})" }
let(:drop_index) { "DROP INDEX CONCURRENTLY IF EXISTS #{replacement_name}" } let(:drop_index) do
<<~SQL
DROP INDEX CONCURRENTLY
IF EXISTS "public"."#{replacement_name}"
SQL
end
let!(:original_index) { find_index_create_statement } let!(:original_index) { find_index_create_statement }
...@@ -58,18 +77,17 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -58,18 +77,17 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
end end
it 'replaces the existing index with an identical index' do it 'replaces the existing index with an identical index' do
expect(subject).to receive(:disable_statement_timeout).exactly(3).times.and_yield expect(subject).to receive(:disable_statement_timeout).twice.and_yield
expect_to_execute_concurrently_in_order(drop_index)
expect_to_execute_concurrently_in_order(create_index) expect_to_execute_concurrently_in_order(create_index)
expect_next_instance_of(::Gitlab::Database::WithLockRetries) do |instance| expect_next_instance_of(::Gitlab::Database::WithLockRetries) do |instance|
expect(instance).to receive(:run).with(raise_on_exhaustion: true).and_yield expect(instance).to receive(:run).with(raise_on_exhaustion: true).and_yield
end end
expect_to_execute_in_order("ALTER INDEX #{index.name} RENAME TO #{replaced_name}") expect_index_rename(index.name, replaced_name)
expect_to_execute_in_order("ALTER INDEX #{replacement_name} RENAME TO #{index.name}") expect_index_rename(replacement_name, index.name)
expect_to_execute_in_order("ALTER INDEX #{replaced_name} RENAME TO #{replacement_name}") expect_index_rename(replaced_name, replacement_name)
expect_to_execute_concurrently_in_order(drop_index) expect_to_execute_concurrently_in_order(drop_index)
...@@ -93,9 +111,9 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -93,9 +111,9 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
expect(instance).to receive(:run).with(raise_on_exhaustion: true).and_yield expect(instance).to receive(:run).with(raise_on_exhaustion: true).and_yield
end end
expect_to_execute_in_order("ALTER INDEX #{index.name} RENAME TO #{replaced_name}") expect_index_rename(index.name, replaced_name)
expect_to_execute_in_order("ALTER INDEX #{replacement_name} RENAME TO #{index.name}") expect_index_rename(replacement_name, index.name)
expect_to_execute_in_order("ALTER INDEX #{replaced_name} RENAME TO #{replacement_name}") expect_index_rename(replaced_name, replacement_name)
expect_to_execute_concurrently_in_order(drop_index) expect_to_execute_concurrently_in_order(drop_index)
...@@ -107,14 +125,12 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -107,14 +125,12 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
context 'when it fails to create the replacement index' do context 'when it fails to create the replacement index' do
it 'safely cleans up and signals the error' do it 'safely cleans up and signals the error' do
expect_to_execute_concurrently_in_order(drop_index)
expect(connection).to receive(:execute).with(create_index).ordered expect(connection).to receive(:execute).with(create_index).ordered
.and_raise(ActiveRecord::ConnectionTimeoutError, 'connect timeout') .and_raise(ActiveRecord::ConnectionTimeoutError, 'connect timeout')
expect_to_execute_concurrently_in_order(drop_index) expect_to_execute_concurrently_in_order(drop_index)
expect { subject.perform }.to raise_error(described_class::ReindexError, /connect timeout/) expect { subject.perform }.to raise_error(ActiveRecord::ConnectionTimeoutError, /connect timeout/)
check_index_exists check_index_exists
end end
...@@ -122,11 +138,10 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -122,11 +138,10 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
context 'when the replacement index is not valid' do context 'when the replacement index is not valid' do
it 'safely cleans up and signals the error' do it 'safely cleans up and signals the error' do
expect_to_execute_concurrently_in_order(drop_index) replacement_index = double('replacement index', valid_index?: false)
expect_to_execute_concurrently_in_order(create_index) allow(Gitlab::Database::PostgresIndex).to receive(:find_by).with(schema: 'public', name: replacement_name).and_return(nil, replacement_index)
replacement_index = double('replacement index', valid?: false) expect_to_execute_concurrently_in_order(create_index)
allow(Gitlab::Database::Reindexing::Index).to receive(:find_with_schema).with("public.#{replacement_name}").and_return(replacement_index)
expect_to_execute_concurrently_in_order(drop_index) expect_to_execute_concurrently_in_order(drop_index)
...@@ -138,20 +153,20 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -138,20 +153,20 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
context 'when a database error occurs while swapping the indexes' do context 'when a database error occurs while swapping the indexes' do
it 'safely cleans up and signals the error' do it 'safely cleans up and signals the error' do
expect_to_execute_concurrently_in_order(drop_index) replacement_index = double('replacement index', valid_index?: true)
allow(Gitlab::Database::PostgresIndex).to receive(:find_by).with(schema: 'public', name: replacement_name).and_return(nil, replacement_index)
expect_to_execute_concurrently_in_order(create_index) expect_to_execute_concurrently_in_order(create_index)
expect_next_instance_of(::Gitlab::Database::WithLockRetries) do |instance| expect_next_instance_of(::Gitlab::Database::WithLockRetries) do |instance|
expect(instance).to receive(:run).with(raise_on_exhaustion: true).and_yield expect(instance).to receive(:run).with(raise_on_exhaustion: true).and_yield
end end
expect(connection).to receive(:execute).ordered expect_index_rename(index.name, replaced_name).and_raise(ActiveRecord::ConnectionTimeoutError, 'connect timeout')
.with("ALTER INDEX #{index.name} RENAME TO #{replaced_name}")
.and_raise(ActiveRecord::ConnectionTimeoutError, 'connect timeout')
expect_to_execute_concurrently_in_order(drop_index) expect_to_execute_concurrently_in_order(drop_index)
expect { subject.perform }.to raise_error(described_class::ReindexError, /connect timeout/) expect { subject.perform }.to raise_error(ActiveRecord::ConnectionTimeoutError, /connect timeout/)
check_index_exists check_index_exists
end end
...@@ -159,7 +174,6 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -159,7 +174,6 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
context 'when with_lock_retries fails to acquire the lock' do context 'when with_lock_retries fails to acquire the lock' do
it 'safely cleans up and signals the error' do it 'safely cleans up and signals the error' do
expect_to_execute_concurrently_in_order(drop_index)
expect_to_execute_concurrently_in_order(create_index) expect_to_execute_concurrently_in_order(create_index)
expect_next_instance_of(::Gitlab::Database::WithLockRetries) do |instance| expect_next_instance_of(::Gitlab::Database::WithLockRetries) do |instance|
...@@ -169,7 +183,7 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -169,7 +183,7 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
expect_to_execute_concurrently_in_order(drop_index) expect_to_execute_concurrently_in_order(drop_index)
expect { subject.perform }.to raise_error(described_class::ReindexError, /exhausted/) expect { subject.perform }.to raise_error(::Gitlab::Database::WithLockRetries::AttemptsExhaustedError, /exhausted/)
check_index_exists check_index_exists
end end
...@@ -185,8 +199,11 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do ...@@ -185,8 +199,11 @@ RSpec.describe Gitlab::Database::Reindexing::ConcurrentReindex, '#perform' do
end end
end end
def expect_to_execute_in_order(sql) def expect_index_rename(from, to)
expect(connection).to receive(:execute).with(sql).ordered.and_call_original expect(connection).to receive(:execute).with(<<~SQL).ordered
ALTER INDEX "public"."#{from}"
RENAME TO "#{to}"
SQL
end end
def find_index_create_statement def find_index_create_statement
......
# frozen_string_literal: true
require 'spec_helper'
RSpec.describe Gitlab::Database::Reindexing do
describe '.perform' do
context 'multiple indexes' do
let(:indexes) { [double, double] }
let(:reindexers) { [double, double] }
it 'performs concurrent reindexing for each index' do
indexes.zip(reindexers).each do |index, reindexer|
expect(Gitlab::Database::Reindexing::ConcurrentReindex).to receive(:new).with(index).ordered.and_return(reindexer)
expect(reindexer).to receive(:perform)
end
described_class.perform(indexes)
end
end
context 'single index' do
let(:index) { double }
let(:reindexer) { double }
it 'performs concurrent reindexing for single index' do
expect(Gitlab::Database::Reindexing::ConcurrentReindex).to receive(:new).with(index).and_return(reindexer)
expect(reindexer).to receive(:perform)
described_class.perform(index)
end
end
end
end
...@@ -165,30 +165,32 @@ RSpec.describe 'gitlab:db namespace rake task' do ...@@ -165,30 +165,32 @@ RSpec.describe 'gitlab:db namespace rake task' do
end end
describe 'reindex' do describe 'reindex' do
let(:reindex) { double('reindex') }
let(:indexes) { double('indexes') }
context 'when no index_name is given' do context 'when no index_name is given' do
it 'raises an error' do it 'rebuilds a random number of large indexes' do
expect do expect(Gitlab::Database::PostgresIndex).to receive_message_chain('non_unique.non_partitioned.random_few').and_return(indexes)
run_rake_task('gitlab:db:reindex', '') expect(Gitlab::Database::Reindexing).to receive(:perform).with(indexes)
end.to raise_error(ArgumentError, /must give the index name/)
run_rake_task('gitlab:db:reindex')
end end
end end
context 'with index name given' do context 'with index name given' do
let(:index) { double('index') } let(:index) { double('index') }
let(:reindex) { double('reindex') }
it 'calls the index rebuilder with the proper arguments' do it 'calls the index rebuilder with the proper arguments' do
expect(Gitlab::Database::Reindexing::Index).to receive(:find_with_schema).with('public.foo_idx').and_return(index) expect(Gitlab::Database::PostgresIndex).to receive(:by_identifier).with('public.foo_idx').and_return(index)
expect(Gitlab::Database::Reindexing::ConcurrentReindex).to receive(:new).with(index, any_args).and_return(reindex) expect(Gitlab::Database::Reindexing).to receive(:perform).with(index)
expect(reindex).to receive(:perform)
run_rake_task('gitlab:db:reindex', '[public.foo_idx]') run_rake_task('gitlab:db:reindex', '[public.foo_idx]')
end end
it 'raises an error if the index does not exist' do it 'raises an error if the index does not exist' do
expect(Gitlab::Database::Reindexing::Index).to receive(:find_with_schema).with('public.absent_index').and_return(nil) expect(Gitlab::Database::PostgresIndex).to receive(:by_identifier).with('public.absent_index').and_raise(ActiveRecord::RecordNotFound)
expect { run_rake_task('gitlab:db:reindex', '[public.absent_index]') }.to raise_error(ArgumentError, /index does not exist/) expect { run_rake_task('gitlab:db:reindex', '[public.absent_index]') }.to raise_error(ActiveRecord::RecordNotFound)
end end
end end
end end
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment