Commit f1f55e6e authored by Dylan Griffith's avatar Dylan Griffith

Fix more N+1 issues when indexing notes in Elasticsearch

Since we already had an N+1 test this required a couple of changes to
detect these problems:

1. Add `:elastic` to the test setup in order to allow for GitLab to
   finish setting up the Elasticsearch index and ensure that the
   `remove_permissions_data_from_notes_documents` was considered finished.
   Without this we couldn't trigger the logic to load project permissions
   for the notes
   https://gitlab.com/gitlab-org/gitlab/-/blob/02f78e50879aa2e9facafe724a61e20d4640a342/ee/lib/elastic/latest/note_instance_proxy.rb#L33
2. We also needed to move a `stub_const` into a separate test block so
   it didn't interfere with the N+1 test for notes. Without this we weren't
   actually processing all the notes and the test was a false
   positive.  The `stub_const` here was only necessary for the one test
   that actually tests this limit. It was actually interfering with some
   other N+1 tests where we were adding more than 10 documents. As such
   moving this closer to the relevant test makes more sense. It also
   required updating a few of the other tests to stop referring to the
   `limit` variable. This value was always equal to the number of documents
   in `fake_refs` anyway so it was unnecessary to have this variable.
parent d99352f7
---
title: Fix more N+1 issues when indexing notes in Elasticsearch
merge_request: 58751
author:
type: performance
...@@ -26,7 +26,7 @@ module Elastic ...@@ -26,7 +26,7 @@ module Elastic
# rubocop: disable CodeReuse/ActiveRecord # rubocop: disable CodeReuse/ActiveRecord
def preload_indexing_data(relation) def preload_indexing_data(relation)
relation.includes(noteable: :assignees) relation.includes(noteable: :assignees, project: [:project_feature, :route])
end end
# rubocop: enable CodeReuse/ActiveRecord # rubocop: enable CodeReuse/ActiveRecord
......
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
require 'spec_helper' require 'spec_helper'
RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_state do RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_state, :elastic do
let(:ref_class) { ::Gitlab::Elastic::DocumentReference } let(:ref_class) { ::Gitlab::Elastic::DocumentReference }
let(:fake_refs) { Array.new(10) { |i| ref_class.new(Issue, i, "issue_#{i}", 'project_1') } } let(:fake_refs) { Array.new(10) { |i| ref_class.new(Issue, i, "issue_#{i}", 'project_1') } }
...@@ -125,25 +125,19 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st ...@@ -125,25 +125,19 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st
end end
describe '#execute' do describe '#execute' do
let(:shard_limit) { 5 } context 'limit is less than refs count' do
let(:shard_number) { 2 }
let(:limit) { shard_limit * shard_number }
before do before do
stub_const('Elastic::ProcessBookkeepingService::SHARD_LIMIT', shard_limit) stub_const('Elastic::ProcessBookkeepingService::SHARD_LIMIT', 2)
stub_const('Elastic::ProcessBookkeepingService::SHARDS_NUMBER', shard_number) stub_const('Elastic::ProcessBookkeepingService::SHARDS_NUMBER', 2)
end end
context 'limit is less than refs count' do
let(:shard_limit) { 2 }
it 'processes only up to limit' do it 'processes only up to limit' do
described_class.track!(*fake_refs) described_class.track!(*fake_refs)
expect(described_class.queue_size).to eq(fake_refs.size) expect(described_class.queue_size).to eq(fake_refs.size)
allow_processing(*fake_refs) allow_processing(*fake_refs)
expect { described_class.new.execute }.to change(described_class, :queue_size).by(-limit) expect { described_class.new.execute }.to change(described_class, :queue_size).by(-4)
end end
end end
...@@ -151,17 +145,17 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st ...@@ -151,17 +145,17 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st
described_class.track!(*fake_refs) described_class.track!(*fake_refs)
expect(described_class.queue_size).to eq(fake_refs.size) expect(described_class.queue_size).to eq(fake_refs.size)
expect_processing(*fake_refs[0...limit]) expect_processing(*fake_refs)
expect { described_class.new.execute }.to change(described_class, :queue_size).by(-limit) expect { described_class.new.execute }.to change(described_class, :queue_size).by(-fake_refs.count)
end end
it 'returns the number of documents processed' do it 'returns the number of documents processed' do
described_class.track!(*fake_refs) described_class.track!(*fake_refs)
expect_processing(*fake_refs[0...limit]) expect_processing(*fake_refs)
expect(described_class.new.execute).to eq(limit) expect(described_class.new.execute).to eq(fake_refs.count)
end end
it 'returns 0 without writing to the index when there are no documents' do it 'returns 0 without writing to the index when there are no documents' do
...@@ -175,9 +169,9 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st ...@@ -175,9 +169,9 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st
failed = fake_refs[0] failed = fake_refs[0]
expect(described_class.queue_size).to eq(10) expect(described_class.queue_size).to eq(10)
expect_processing(*fake_refs[0...limit], failures: [failed]) expect_processing(*fake_refs, failures: [failed])
expect { described_class.new.execute }.to change(described_class, :queue_size).by(-limit + 1) expect { described_class.new.execute }.to change(described_class, :queue_size).by(-fake_refs.count + 1)
shard = described_class.shard_number(failed.serialize) shard = described_class.shard_number(failed.serialize)
serialized = described_class.queued_items[shard].first[0] serialized = described_class.queued_items[shard].first[0]
...@@ -224,6 +218,11 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st ...@@ -224,6 +218,11 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st
end end
it 'does not have N+1 queries for notes' do it 'does not have N+1 queries for notes' do
# Gitaly N+1 calls when processing notes on commits
# https://gitlab.com/gitlab-org/gitlab/-/issues/327086 . Even though
# this block is in the spec there is still an N+1 to fix in the actual
# code.
Gitlab::GitalyClient.allow_n_plus_1_calls do
notes = [] notes = []
2.times do 2.times do
...@@ -231,6 +230,7 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st ...@@ -231,6 +230,7 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st
notes << create(:discussion_note_on_merge_request) notes << create(:discussion_note_on_merge_request)
notes << create(:note_on_merge_request) notes << create(:note_on_merge_request)
notes << create(:note_on_commit) notes << create(:note_on_commit)
notes << create(:diff_note_on_merge_request)
end end
described_class.track!(*notes) described_class.track!(*notes)
...@@ -242,12 +242,14 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st ...@@ -242,12 +242,14 @@ RSpec.describe Elastic::ProcessBookkeepingService, :clean_gitlab_redis_shared_st
notes << create(:discussion_note_on_merge_request) notes << create(:discussion_note_on_merge_request)
notes << create(:note_on_merge_request) notes << create(:note_on_merge_request)
notes << create(:note_on_commit) notes << create(:note_on_commit)
notes << create(:diff_note_on_merge_request)
end end
described_class.track!(*notes) described_class.track!(*notes)
expect { described_class.new.execute }.not_to exceed_all_query_limit(control) expect { described_class.new.execute }.not_to exceed_all_query_limit(control)
end end
end
it 'does not have N+1 queries for issues' do it 'does not have N+1 queries for issues' do
issues = create_list(:issue, 2) issues = create_list(:issue, 2)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment