Commit 55542258 authored by Kerri Miller's avatar Kerri Miller

Merge branch '347015-refactor-ipynbdiff-implementation' into 'master'

Resolve "Refactor Ipynbdiff Implementation"

See merge request gitlab-org/gitlab!75718
parents 21fc0769 e653f4c8
...@@ -15,19 +15,8 @@ class BlobPresenter < Gitlab::View::Presenter::Delegated ...@@ -15,19 +15,8 @@ class BlobPresenter < Gitlab::View::Presenter::Delegated
Gitlab::Highlight.highlight( Gitlab::Highlight.highlight(
blob.path, blob.path,
limited_blob_data(to: to), blob_data(to),
language: language, language: blob_language,
plain: plain
)
end
def highlight_transformed(plain: nil)
load_all_blob_data
Gitlab::Highlight.highlight(
blob.path,
transformed_blob_data,
language: transformed_blob_language,
plain: plain plain: plain
) )
end end
...@@ -38,6 +27,14 @@ class BlobPresenter < Gitlab::View::Presenter::Delegated ...@@ -38,6 +27,14 @@ class BlobPresenter < Gitlab::View::Presenter::Delegated
highlight(plain: false) highlight(plain: false)
end end
def blob_data(to)
@_blob_data ||= Gitlab::Diff::CustomDiff.transformed_blob_data(blob) || limited_blob_data(to: to)
end
def blob_language
@_blob_language ||= Gitlab::Diff::CustomDiff.transformed_blob_language(blob) || language
end
def raw_plain_data def raw_plain_data
blob.data unless blob.binary? blob.data unless blob.binary?
end end
...@@ -134,23 +131,6 @@ class BlobPresenter < Gitlab::View::Presenter::Delegated ...@@ -134,23 +131,6 @@ class BlobPresenter < Gitlab::View::Presenter::Delegated
def language def language
blob.language_from_gitattributes blob.language_from_gitattributes
end end
def transformed_blob_language
@transformed_blob_language ||= blob.path.ends_with?('.ipynb') ? 'md' : language
end
def transformed_blob_data
@transformed_blob ||= if blob.path.ends_with?('.ipynb') && blob.transformed_for_diff
IpynbDiff.transform(blob.data,
raise_errors: true,
options: { include_metadata: false, cell_decorator: :percent })
end
@transformed_blob ||= blob.data
rescue IpynbDiff::InvalidNotebookError => e
Gitlab::ErrorTracking.log_exception(e)
blob.data
end
end end
BlobPresenter.prepend_mod_with('BlobPresenter') BlobPresenter.prepend_mod_with('BlobPresenter')
# frozen_string_literal: true
module Gitlab
module Diff
module CustomDiff
class << self
def preprocess_before_diff(path, old_blob, new_blob)
return unless path.ends_with? '.ipynb'
transformed_diff(old_blob&.data, new_blob&.data)&.tap do
transformed_for_diff(new_blob, old_blob)
Gitlab::AppLogger.info({ message: 'IPYNB_DIFF_GENERATED' })
end
rescue IpynbDiff::InvalidNotebookError => e
Gitlab::ErrorTracking.log_exception(e)
nil
end
def transformed_diff(before, after)
transformed_diff = IpynbDiff.diff(before, after,
diff_opts: { context: 5, include_diff_info: true },
transform_options: { cell_decorator: :percent },
raise_if_invalid_notebook: true)
strip_diff_frontmatter(transformed_diff)
end
def transformed_blob_language(blob)
'md' if transformed_for_diff?(blob)
end
def transformed_blob_data(blob)
if transformed_for_diff?(blob)
IpynbDiff.transform(blob.data,
raise_errors: true,
options: { include_metadata: false, cell_decorator: :percent })
end
end
def strip_diff_frontmatter(diff_content)
diff_content.scan(/.*\n/)[2..-1]&.join('') if diff_content.present?
end
def blobs_with_transformed_diffs
@blobs_with_transformed_diffs ||= {}
end
def transformed_for_diff?(blob)
blobs_with_transformed_diffs[blob]
end
def transformed_for_diff(*blobs)
blobs.each do |b|
blobs_with_transformed_diffs[b] = true if b
end
end
end
end
end
end
...@@ -44,7 +44,11 @@ module Gitlab ...@@ -44,7 +44,11 @@ module Gitlab
new_blob_lazy new_blob_lazy
old_blob_lazy old_blob_lazy
preprocess_before_diff(diff) if Feature.enabled?(:jupyter_clean_diffs, repository.project, default_enabled: true) diff.diff = Gitlab::Diff::CustomDiff.preprocess_before_diff(diff.new_path, old_blob_lazy, new_blob_lazy) || diff.diff if use_custom_diff?
end
def use_custom_diff?
strong_memoize(:_custom_diff_enabled) { Feature.enabled?(:jupyter_clean_diffs, repository.project, default_enabled: true) }
end end
def position(position_marker, position_type: :text) def position(position_marker, position_type: :text)
...@@ -450,33 +454,6 @@ module Gitlab ...@@ -450,33 +454,6 @@ module Gitlab
find_renderable_viewer_class(classes) find_renderable_viewer_class(classes)
end end
def preprocess_before_diff(diff)
return unless diff.new_path.ends_with? '.ipynb'
from = old_blob_lazy&.data
to = new_blob_lazy&.data
transformed_diff = IpynbDiff.diff(from, to,
diff_opts: { context: 5, include_diff_info: true },
transform_options: { cell_decorator: :percent },
raise_if_invalid_notebook: true)
new_diff = strip_diff_frontmatter(transformed_diff)
if new_diff
diff.diff = new_diff
new_blob_lazy.transformed_for_diff = true if new_blob_lazy
old_blob_lazy.transformed_for_diff = true if old_blob_lazy
end
Gitlab::AppLogger.info({ message: new_diff ? 'IPYNB_DIFF_GENERATED' : 'IPYNB_DIFF_NIL' })
rescue IpynbDiff::InvalidNotebookError => e
Gitlab::ErrorTracking.log_exception(e)
end
def strip_diff_frontmatter(diff_content)
diff_content.scan(/.*\n/)[2..-1]&.join('') if diff_content.present?
end
def alternate_viewer_class def alternate_viewer_class
return unless viewer.instance_of?(DiffViewer::Renamed) return unless viewer.instance_of?(DiffViewer::Renamed)
......
...@@ -153,8 +153,6 @@ module Gitlab ...@@ -153,8 +153,6 @@ module Gitlab
blob.load_all_data! blob.load_all_data!
return blob.present.highlight_transformed.lines if Feature.enabled?(:jupyter_clean_diffs, @project, default_enabled: true)
blob.present.highlight.lines blob.present.highlight.lines
end end
......
...@@ -24,7 +24,7 @@ module Gitlab ...@@ -24,7 +24,7 @@ module Gitlab
LFS_POINTER_MIN_SIZE = 120.bytes LFS_POINTER_MIN_SIZE = 120.bytes
LFS_POINTER_MAX_SIZE = 200.bytes LFS_POINTER_MAX_SIZE = 200.bytes
attr_accessor :size, :mode, :id, :commit_id, :loaded_size, :binary, :transformed_for_diff attr_accessor :size, :mode, :id, :commit_id, :loaded_size, :binary
attr_writer :name, :path, :data attr_writer :name, :path, :data
def self.gitlab_blob_truncated_true def self.gitlab_blob_truncated_true
...@@ -127,7 +127,6 @@ module Gitlab ...@@ -127,7 +127,6 @@ module Gitlab
# Retain the actual size before it is encoded # Retain the actual size before it is encoded
@loaded_size = @data.bytesize if @data @loaded_size = @data.bytesize if @data
@loaded_all_data = @loaded_size == size @loaded_all_data = @loaded_size == size
@transformed_for_diff = false
record_metric_blob_size record_metric_blob_size
record_metric_truncated(truncated?) record_metric_truncated(truncated?)
......
# frozen_string_literal: true
require 'spec_helper'
RSpec.describe Gitlab::Diff::CustomDiff do
include RepoHelpers
let(:project) { create(:project, :repository) }
let(:repository) { project.repository }
let(:ipynb_blob) { repository.blob_at('f6b7a707', 'files/ipython/markdown-table.ipynb') }
let(:blob) { repository.blob_at('HEAD', 'files/ruby/regex.rb') }
describe '#preprocess_before_diff' do
context 'for ipynb files' do
it 'transforms the diff' do
expect(described_class.preprocess_before_diff(ipynb_blob.path, nil, ipynb_blob)).not_to include('cells')
end
it 'adds the blob to the list of transformed blobs' do
described_class.preprocess_before_diff(ipynb_blob.path, nil, ipynb_blob)
expect(described_class.transformed_for_diff?(ipynb_blob)).to be_truthy
end
end
context 'for other files' do
it 'returns nil' do
expect(described_class.preprocess_before_diff(blob.path, nil, blob)).to be_nil
end
it 'does not add the blob to the list of transformed blobs' do
described_class.preprocess_before_diff(blob.path, nil, blob)
expect(described_class.transformed_for_diff?(blob)).to be_falsey
end
end
end
describe '#transformed_blob_data' do
it 'transforms blob data if file was processed' do
described_class.preprocess_before_diff(ipynb_blob.path, nil, ipynb_blob)
expect(described_class.transformed_blob_data(ipynb_blob)).not_to include('cells')
end
it 'does not transform blob data if file was not processed' do
expect(described_class.transformed_blob_data(ipynb_blob)).to be_nil
end
end
describe '#transformed_blob_language' do
it 'is md when file was preprocessed' do
described_class.preprocess_before_diff(ipynb_blob.path, nil, ipynb_blob)
expect(described_class.transformed_blob_language(ipynb_blob)).to eq('md')
end
it 'is nil for a .ipynb blob that was not preprocessed' do
expect(described_class.transformed_blob_language(ipynb_blob)).to be_nil
end
end
end
...@@ -159,27 +159,25 @@ RSpec.describe BlobPresenter do ...@@ -159,27 +159,25 @@ RSpec.describe BlobPresenter do
presenter.highlight presenter.highlight
end end
end end
end
describe '#highlight_transformed' do
context 'when blob is ipynb' do context 'when blob is ipynb' do
let(:blob) { repository.blob_at('f6b7a707', 'files/ipython/markdown-table.ipynb') } let(:blob) { repository.blob_at('f6b7a707', 'files/ipython/markdown-table.ipynb') }
let(:git_blob) { blob.__getobj__ } let(:git_blob) { blob.__getobj__ }
before do before do
allow(git_blob).to receive(:transformed_for_diff).and_return(true) allow(Gitlab::Diff::CustomDiff).to receive(:transformed_for_diff?).and_return(true)
end end
it 'uses md as the transformed language' do it 'uses md as the transformed language' do
expect(Gitlab::Highlight).to receive(:highlight).with('files/ipython/markdown-table.ipynb', anything, plain: nil, language: 'md') expect(Gitlab::Highlight).to receive(:highlight).with('files/ipython/markdown-table.ipynb', anything, plain: nil, language: 'md')
presenter.highlight_transformed presenter.highlight
end end
it 'transforms the blob' do it 'transforms the blob' do
expect(Gitlab::Highlight).to receive(:highlight).with('files/ipython/markdown-table.ipynb', include("%%"), plain: nil, language: 'md') expect(Gitlab::Highlight).to receive(:highlight).with('files/ipython/markdown-table.ipynb', include("%%"), plain: nil, language: 'md')
presenter.highlight_transformed presenter.highlight
end end
end end
...@@ -197,7 +195,7 @@ RSpec.describe BlobPresenter do ...@@ -197,7 +195,7 @@ RSpec.describe BlobPresenter do
it 'does not transform the file' do it 'does not transform the file' do
expect(Gitlab::Highlight).to receive(:highlight).with('files/ruby/regex.rb', git_blob.data, plain: nil, language: 'ruby') expect(Gitlab::Highlight).to receive(:highlight).with('files/ruby/regex.rb', git_blob.data, plain: nil, language: 'ruby')
presenter.highlight_transformed presenter.highlight
end end
end end
end end
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment