Commit 7473e4a3 authored by Andreas Brandl's avatar Andreas Brandl

Merge branch 'osw-improve-discussions-query' into 'master'

Considerably improve the query performance for MR discussions load

See merge request gitlab-org/gitlab!16635
parents 220e1fdb 71a1a017
...@@ -211,7 +211,7 @@ class Projects::MergeRequestsController < Projects::MergeRequests::ApplicationCo ...@@ -211,7 +211,7 @@ class Projects::MergeRequestsController < Projects::MergeRequests::ApplicationCo
end end
def discussions def discussions
merge_request.preload_discussions_diff_highlight merge_request.discussions_diffs.load_highlight
super super
end end
......
...@@ -108,13 +108,10 @@ class DiffNote < Note ...@@ -108,13 +108,10 @@ class DiffNote < Note
end end
def fetch_diff_file def fetch_diff_file
return note_diff_file.raw_diff_file if note_diff_file
file = file =
if note_diff_file if created_at_diff?(noteable.diff_refs)
diff = Gitlab::Git::Diff.new(note_diff_file.to_hash)
Gitlab::Diff::File.new(diff,
repository: repository,
diff_refs: original_position.diff_refs)
elsif created_at_diff?(noteable.diff_refs)
# We're able to use the already persisted diffs (Postgres) if we're # We're able to use the already persisted diffs (Postgres) if we're
# presenting a "current version" of the MR discussion diff. # presenting a "current version" of the MR discussion diff.
# So no need to make an extra Gitaly diff request for it. # So no need to make an extra Gitaly diff request for it.
...@@ -126,9 +123,7 @@ class DiffNote < Note ...@@ -126,9 +123,7 @@ class DiffNote < Note
original_position.diff_file(repository) original_position.diff_file(repository)
end end
# Since persisted diff files already have its content "unfolded" file&.unfold_diff_lines(position)
# there's no need to make it pass through the unfolding process.
file&.unfold_diff_lines(position) unless note_diff_file
file file
end end
......
...@@ -454,24 +454,17 @@ class MergeRequest < ApplicationRecord ...@@ -454,24 +454,17 @@ class MergeRequest < ApplicationRecord
true true
end end
def preload_discussions_diff_highlight
preloadable_files = note_diff_files.for_commit_or_unresolved
discussions_diffs.load_highlight(preloadable_files.pluck(:id))
end
def discussions_diffs def discussions_diffs
strong_memoize(:discussions_diffs) do strong_memoize(:discussions_diffs) do
note_diff_files = NoteDiffFile
.joins(:diff_note)
.merge(notes.or(commit_notes))
.includes(diff_note: :project)
Gitlab::DiscussionsDiff::FileCollection.new(note_diff_files.to_a) Gitlab::DiscussionsDiff::FileCollection.new(note_diff_files.to_a)
end end
end end
def note_diff_files
NoteDiffFile
.where(diff_note: discussion_notes)
.includes(diff_note: :project)
end
def diff_size def diff_size
# Calling `merge_request_diff.diffs.real_size` will also perform # Calling `merge_request_diff.diffs.real_size` will also perform
# highlighting, which we don't need here. # highlighting, which we don't need here.
......
...@@ -3,15 +3,11 @@ ...@@ -3,15 +3,11 @@
class NoteDiffFile < ApplicationRecord class NoteDiffFile < ApplicationRecord
include DiffFile include DiffFile
scope :for_commit_or_unresolved, -> do
joins(:diff_note).where("resolved_at IS NULL OR noteable_type = 'Commit'")
end
scope :referencing_sha, -> (oids, project_id:) do scope :referencing_sha, -> (oids, project_id:) do
joins(:diff_note).where(notes: { project_id: project_id, commit_id: oids }) joins(:diff_note).where(notes: { project_id: project_id, commit_id: oids })
end end
delegate :original_position, :project, to: :diff_note delegate :original_position, :project, :resolved_at, to: :diff_note
belongs_to :diff_note, inverse_of: :note_diff_file belongs_to :diff_note, inverse_of: :note_diff_file
......
---
title: Considerably improve the query performance for MR discussions load
merge_request: 16635
author:
type: performance
...@@ -4,11 +4,16 @@ module Gitlab ...@@ -4,11 +4,16 @@ module Gitlab
module DiscussionsDiff module DiscussionsDiff
class FileCollection class FileCollection
include Gitlab::Utils::StrongMemoize include Gitlab::Utils::StrongMemoize
include Enumerable
def initialize(collection) def initialize(collection)
@collection = collection @collection = collection
end end
def each(&block)
@collection.each(&block)
end
# Returns a Gitlab::Diff::File with the given ID (`unique_identifier` in # Returns a Gitlab::Diff::File with the given ID (`unique_identifier` in
# Gitlab::Diff::File). # Gitlab::Diff::File).
def find_by_id(id) def find_by_id(id)
...@@ -16,20 +21,12 @@ module Gitlab ...@@ -16,20 +21,12 @@ module Gitlab
end end
# Writes cache and preloads highlighted diff lines for # Writes cache and preloads highlighted diff lines for
# object IDs, in @collection. # highlightable object IDs, in @collection.
#
# highlightable_ids - Diff file `Array` responding to ID. The ID will be used
# to generate the cache key.
# #
# - Highlight cache is written just for uncached diff files # - Highlight cache is written just for uncached diff files
# - The cache content is not updated (there's no need to do so) # - The cache content is not updated (there's no need to do so)
def load_highlight(highlightable_ids) def load_highlight
preload_highlighted_lines(highlightable_ids) ids = highlightable_collection_ids
end
private
def preload_highlighted_lines(ids)
cached_content = read_cache(ids) cached_content = read_cache(ids)
uncached_ids = ids.select.each_with_index { |_, i| cached_content[i].nil? } uncached_ids = ids.select.each_with_index { |_, i| cached_content[i].nil? }
...@@ -46,6 +43,12 @@ module Gitlab ...@@ -46,6 +43,12 @@ module Gitlab
end end
end end
private
def highlightable_collection_ids
each.with_object([]) { |file, memo| memo << file.id unless file.resolved_at }
end
def read_cache(ids) def read_cache(ids)
HighlightCache.read_multiple(ids) HighlightCache.read_multiple(ids)
end end
...@@ -57,9 +60,7 @@ module Gitlab ...@@ -57,9 +60,7 @@ module Gitlab
end end
def diff_files def diff_files
strong_memoize(:diff_files) do strong_memoize(:diff_files) { map(&:raw_diff_file) }
@collection.map(&:raw_diff_file)
end
end end
# Processes the diff lines highlighting for diff files matching the given # Processes the diff lines highlighting for diff files matching the given
......
...@@ -1289,7 +1289,7 @@ describe Projects::MergeRequestsController do ...@@ -1289,7 +1289,7 @@ describe Projects::MergeRequestsController do
expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection| expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection|
note_diff_file = commit_diff_note.note_diff_file note_diff_file = commit_diff_note.note_diff_file
expect(collection).to receive(:load_highlight).with([note_diff_file.id]).and_call_original expect(collection).to receive(:load_highlight).and_call_original
expect(collection).to receive(:find_by_id).with(note_diff_file.id).and_call_original expect(collection).to receive(:find_by_id).with(note_diff_file.id).and_call_original
end end
...@@ -1306,7 +1306,7 @@ describe Projects::MergeRequestsController do ...@@ -1306,7 +1306,7 @@ describe Projects::MergeRequestsController do
expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection| expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection|
note_diff_file = diff_note.note_diff_file note_diff_file = diff_note.note_diff_file
expect(collection).to receive(:load_highlight).with([note_diff_file.id]).and_call_original expect(collection).to receive(:load_highlight).and_call_original
expect(collection).to receive(:find_by_id).with(note_diff_file.id).and_call_original expect(collection).to receive(:find_by_id).with(note_diff_file.id).and_call_original
end end
...@@ -1319,7 +1319,7 @@ describe Projects::MergeRequestsController do ...@@ -1319,7 +1319,7 @@ describe Projects::MergeRequestsController do
expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection| expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection|
note_diff_file = diff_note.note_diff_file note_diff_file = diff_note.note_diff_file
expect(collection).to receive(:load_highlight).with([]).and_call_original expect(collection).to receive(:load_highlight).and_call_original
expect(collection).to receive(:find_by_id).with(note_diff_file.id).and_call_original expect(collection).to receive(:find_by_id).with(note_diff_file.id).and_call_original
end end
......
...@@ -22,11 +22,13 @@ describe Gitlab::DiscussionsDiff::FileCollection do ...@@ -22,11 +22,13 @@ describe Gitlab::DiscussionsDiff::FileCollection do
note_diff_file_b.id => file_b_caching_content }) note_diff_file_b.id => file_b_caching_content })
.and_call_original .and_call_original
subject.load_highlight([note_diff_file_a.id, note_diff_file_b.id]) subject.load_highlight
end end
it 'does not write cache for already cached file' do it 'does not write cache for already cached file' do
subject.load_highlight([note_diff_file_a.id]) file_a_caching_content = diff_note_a.diff_file.highlighted_diff_lines.map(&:to_hash)
Gitlab::DiscussionsDiff::HighlightCache
.write_multiple({ note_diff_file_a.id => file_a_caching_content })
file_b_caching_content = diff_note_b.diff_file.highlighted_diff_lines.map(&:to_hash) file_b_caching_content = diff_note_b.diff_file.highlighted_diff_lines.map(&:to_hash)
...@@ -35,27 +37,42 @@ describe Gitlab::DiscussionsDiff::FileCollection do ...@@ -35,27 +37,42 @@ describe Gitlab::DiscussionsDiff::FileCollection do
.with({ note_diff_file_b.id => file_b_caching_content }) .with({ note_diff_file_b.id => file_b_caching_content })
.and_call_original .and_call_original
subject.load_highlight([note_diff_file_a.id, note_diff_file_b.id]) subject.load_highlight
end end
it 'does not err when given ID does not exist in @collection' do it 'does not write cache for resolved notes' do
expect { subject.load_highlight([999]) }.not_to raise_error diff_note_a.update_column(:resolved_at, Time.now)
file_b_caching_content = diff_note_b.diff_file.highlighted_diff_lines.map(&:to_hash)
expect(Gitlab::DiscussionsDiff::HighlightCache)
.to receive(:write_multiple)
.with({ note_diff_file_b.id => file_b_caching_content })
.and_call_original
subject.load_highlight
end end
it 'loaded diff files have highlighted lines loaded' do it 'loaded diff files have highlighted lines loaded' do
subject.load_highlight([note_diff_file_a.id]) subject.load_highlight
diff_file = subject.find_by_id(note_diff_file_a.id) diff_file_a = subject.find_by_id(note_diff_file_a.id)
diff_file_b = subject.find_by_id(note_diff_file_b.id)
expect(diff_file.highlight_loaded?).to be(true) expect(diff_file_a).to be_highlight_loaded
expect(diff_file_b).to be_highlight_loaded
end end
it 'not loaded diff files does not have highlighted lines loaded' do it 'not loaded diff files does not have highlighted lines loaded' do
subject.load_highlight([note_diff_file_a.id]) diff_note_a.update_column(:resolved_at, Time.now)
subject.load_highlight
diff_file = subject.find_by_id(note_diff_file_b.id) diff_file_a = subject.find_by_id(note_diff_file_a.id)
diff_file_b = subject.find_by_id(note_diff_file_b.id)
expect(diff_file.highlight_loaded?).to be(false) expect(diff_file_a).not_to be_highlight_loaded
expect(diff_file_b).to be_highlight_loaded
end end
end end
end end
...@@ -650,54 +650,55 @@ describe MergeRequest do ...@@ -650,54 +650,55 @@ describe MergeRequest do
end end
end end
describe '#preload_discussions_diff_highlight' do describe '#discussions_diffs' do
let(:merge_request) { create(:merge_request) } let(:merge_request) { create(:merge_request) }
context 'with commit diff note' do shared_examples 'discussions diffs collection' do
let(:other_merge_request) { create(:merge_request) } it 'initializes Gitlab::DiscussionsDiff::FileCollection with correct data' do
note_diff_file = diff_note.note_diff_file
let!(:diff_note) do expect(Gitlab::DiscussionsDiff::FileCollection)
create(:diff_note_on_commit, project: merge_request.project) .to receive(:new)
end .with([note_diff_file])
.and_call_original
let!(:other_mr_diff_note) do result = merge_request.discussions_diffs
create(:diff_note_on_commit, project: other_merge_request.project)
expect(result).to be_a(Gitlab::DiscussionsDiff::FileCollection)
end end
it 'preloads diff highlighting' do it 'eager loads relations' do
expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection| result = merge_request.discussions_diffs
note_diff_file = diff_note.note_diff_file
expect(collection) recorder = ActiveRecord::QueryRecorder.new do
.to receive(:load_highlight) result.first.diff_note
.with([note_diff_file.id]).and_call_original result.first.diff_note.project
end end
merge_request.preload_discussions_diff_highlight expect(recorder.count).to be_zero
end end
end end
context 'with merge request diff note' do context 'with commit diff note' do
let!(:unresolved_diff_note) do let(:other_merge_request) { create(:merge_request) }
create(:diff_note_on_merge_request, project: merge_request.project, noteable: merge_request)
end
let!(:resolved_diff_note) do let!(:diff_note) do
create(:diff_note_on_merge_request, :resolved, project: merge_request.project, noteable: merge_request) create(:diff_note_on_commit, project: merge_request.project)
end end
it 'preloads diff highlighting' do let!(:other_mr_diff_note) do
expect_next_instance_of(Gitlab::DiscussionsDiff::FileCollection) do |collection| create(:diff_note_on_commit, project: other_merge_request.project)
note_diff_file = unresolved_diff_note.note_diff_file end
expect(collection) it_behaves_like 'discussions diffs collection'
.to receive(:load_highlight)
.with([note_diff_file.id])
.and_call_original
end end
merge_request.preload_discussions_diff_highlight context 'with merge request diff note' do
let!(:diff_note) do
create(:diff_note_on_merge_request, project: merge_request.project, noteable: merge_request)
end end
it_behaves_like 'discussions diffs collection'
end end
end end
......
# frozen_string_literal: true
require 'spec_helper'
describe 'merge requests discussions' do
# Further tests can be found at merge_requests_controller_spec.rb
describe 'GET /:namespace/:project/merge_requests/:iid/discussions' do
let(:project) { create(:project, :repository) }
let(:user) { project.owner }
let(:merge_request) { create(:merge_request_with_diffs, target_project: project, source_project: project) }
before do
project.add_developer(user)
login_as(user)
end
def send_request
get discussions_namespace_project_merge_request_path(namespace_id: project.namespace, project_id: project, id: merge_request.iid)
end
it 'returns 200' do
send_request
expect(response.status).to eq(200)
end
# https://docs.gitlab.com/ee/development/query_recorder.html#use-request-specs-instead-of-controller-specs
it 'avoids N+1 DB queries', :request_store do
control = ActiveRecord::QueryRecorder.new { send_request }
create(:diff_note_on_merge_request, noteable: merge_request,
project: merge_request.project)
expect do
send_request
end.not_to exceed_query_limit(control)
end
it 'limits Gitaly queries', :request_store do
Gitlab::GitalyClient.allow_n_plus_1_calls do
create_list(:diff_note_on_merge_request, 7, noteable: merge_request,
project: merge_request.project)
end
# The creations above write into the Gitaly counts
Gitlab::GitalyClient.reset_counts
expect { send_request }
.to change { Gitlab::GitalyClient.get_request_count }.by_at_most(4)
end
end
end
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment