Commit 4acff819 authored by Vitali Tatarintev's avatar Vitali Tatarintev

Merge branch '326425-add-support-to-generate-metrics-queries' into 'master'

Add support to generate metrics queries in instrumentation classes

See merge request gitlab-org/gitlab!62294
parents 0fe2e0bf 36d54200
...@@ -43,12 +43,16 @@ module Gitlab ...@@ -43,12 +43,16 @@ module Gitlab
finish: self.class.metric_finish&.call) finish: self.class.metric_finish&.call)
end end
def relation def to_sql
self.class.metric_relation.call.where(time_constraints) Gitlab::Usage::Metrics::Query.for(self.class.metric_operation, relation, self.class.column)
end end
private private
def relation
self.class.metric_relation.call.where(time_constraints)
end
def time_constraints def time_constraints
case time_frame case time_frame
when '28d' when '28d'
......
# frozen_string_literal: true
module Gitlab
module Usage
module Metrics
class Query
class << self
def for(operation, relation, column = nil, **extra)
case operation
when :count
count(relation, column)
when :distinct_count
distinct_count(relation, column)
when :sum
sum(relation, column)
when :estimate_batch_distinct_count
estimate_batch_distinct_count(relation, column)
when :histogram
histogram(relation, column, **extra)
else
raise ArgumentError, "#{operation} operation not supported"
end
end
private
def count(relation, column = nil)
raw_sql(relation, column)
end
def distinct_count(relation, column = nil)
raw_sql(relation, column, true)
end
def sum(relation, column)
relation.select(relation.all.table[column].sum).to_sql
end
def estimate_batch_distinct_count(relation, column = nil)
raw_sql(relation, column, true)
end
# rubocop: disable CodeReuse/ActiveRecord
def histogram(relation, column, buckets:, bucket_size: buckets.size)
count_grouped = relation.group(column).select(Arel.star.count.as('count_grouped'))
cte = Gitlab::SQL::CTE.new(:count_cte, count_grouped)
bucket_segments = bucket_size - 1
width_bucket = Arel::Nodes::NamedFunction
.new('WIDTH_BUCKET', [cte.table[:count_grouped], buckets.first, buckets.last, bucket_segments])
.as('buckets')
query = cte
.table
.project(width_bucket, cte.table[:count])
.group('buckets')
.order('buckets')
.with(cte.to_arel)
query.to_sql
end
# rubocop: enable CodeReuse/ActiveRecord
def raw_sql(relation, column, distinct = false)
column ||= relation.primary_key
relation.select(relation.all.table[column].count(distinct)).to_sql
end
end
end
end
end
end
...@@ -6,43 +6,20 @@ module Gitlab ...@@ -6,43 +6,20 @@ module Gitlab
class UsageDataQueries < UsageData class UsageDataQueries < UsageData
class << self class << self
def count(relation, column = nil, *args, **kwargs) def count(relation, column = nil, *args, **kwargs)
raw_sql(relation, column) Gitlab::Usage::Metrics::Query.for(:count, relation, column)
end end
def distinct_count(relation, column = nil, *args, **kwargs) def distinct_count(relation, column = nil, *args, **kwargs)
raw_sql(relation, column, :distinct) Gitlab::Usage::Metrics::Query.for(:distinct_count, relation, column)
end
def redis_usage_data(counter = nil, &block)
if block_given?
{ redis_usage_data_block: block.to_s }
elsif counter.present?
{ redis_usage_data_counter: counter }
end
end end
def sum(relation, column, *args, **kwargs) def sum(relation, column, *args, **kwargs)
relation.select(relation.all.table[column].sum).to_sql Gitlab::Usage::Metrics::Query.for(:sum, relation, column)
end end
# rubocop: disable CodeReuse/ActiveRecord # rubocop: disable CodeReuse/ActiveRecord
def histogram(relation, column, buckets:, bucket_size: buckets.size) def histogram(relation, column, buckets:, bucket_size: buckets.size)
count_grouped = relation.group(column).select(Arel.star.count.as('count_grouped')) Gitlab::Usage::Metrics::Query.for(:histogram, relation, column, buckets: buckets, bucket_size: bucket_size)
cte = Gitlab::SQL::CTE.new(:count_cte, count_grouped)
bucket_segments = bucket_size - 1
width_bucket = Arel::Nodes::NamedFunction
.new('WIDTH_BUCKET', [cte.table[:count_grouped], buckets.first, buckets.last, bucket_segments])
.as('buckets')
query = cte
.table
.project(width_bucket, cte.table[:count])
.group('buckets')
.order('buckets')
.with(cte.to_arel)
query.to_sql
end end
# rubocop: enable CodeReuse/ActiveRecord # rubocop: enable CodeReuse/ActiveRecord
...@@ -50,11 +27,11 @@ module Gitlab ...@@ -50,11 +27,11 @@ module Gitlab
# buckets query, because it can't be used to obtain estimations without # buckets query, because it can't be used to obtain estimations without
# supplementary ruby code present in Gitlab::Database::PostgresHll::BatchDistinctCounter # supplementary ruby code present in Gitlab::Database::PostgresHll::BatchDistinctCounter
def estimate_batch_distinct_count(relation, column = nil, *args, **kwargs) def estimate_batch_distinct_count(relation, column = nil, *args, **kwargs)
raw_sql(relation, column, :distinct) Gitlab::Usage::Metrics::Query.for(:estimate_batch_distinct_count, relation, column)
end end
def add(*args) def add(*args)
'SELECT ' + args.map {|arg| "(#{arg})" }.join(' + ') 'SELECT ' + args.map { |arg| "(#{arg})" }.join(' + ')
end end
def maximum_id(model, column = nil) def maximum_id(model, column = nil)
...@@ -63,6 +40,14 @@ module Gitlab ...@@ -63,6 +40,14 @@ module Gitlab
def minimum_id(model, column = nil) def minimum_id(model, column = nil)
end end
def redis_usage_data(counter = nil, &block)
if block_given?
{ redis_usage_data_block: block.to_s }
elsif counter.present?
{ redis_usage_data_counter: counter }
end
end
def jira_service_data def jira_service_data
{ {
projects_jira_server_active: 0, projects_jira_server_active: 0,
...@@ -73,13 +58,6 @@ module Gitlab ...@@ -73,13 +58,6 @@ module Gitlab
def epics_deepest_relationship_level def epics_deepest_relationship_level
{ epics_deepest_relationship_level: 0 } { epics_deepest_relationship_level: 0 }
end end
private
def raw_sql(relation, column, distinct = nil)
column ||= relation.primary_key
relation.select(relation.all.table[column].count(distinct)).to_sql
end
end end
end end
end end
...@@ -5,5 +5,8 @@ require 'spec_helper' ...@@ -5,5 +5,8 @@ require 'spec_helper'
RSpec.describe Gitlab::Usage::Metrics::Instrumentations::CountBoardsMetric do RSpec.describe Gitlab::Usage::Metrics::Instrumentations::CountBoardsMetric do
let_it_be(:board) { create(:board) } let_it_be(:board) { create(:board) }
it_behaves_like 'a correct instrumented metric value', { time_frame: 'all', data_source: 'database' }, 1 let(:expected_value) { 1 }
let(:expected_query) { 'SELECT COUNT("boards"."id") FROM "boards"' }
it_behaves_like 'a correct instrumented metric value and query', { time_frame: 'all' }
end end
...@@ -5,5 +5,8 @@ require 'spec_helper' ...@@ -5,5 +5,8 @@ require 'spec_helper'
RSpec.describe Gitlab::Usage::Metrics::Instrumentations::CountIssuesMetric do RSpec.describe Gitlab::Usage::Metrics::Instrumentations::CountIssuesMetric do
let_it_be(:issue) { create(:issue) } let_it_be(:issue) { create(:issue) }
it_behaves_like 'a correct instrumented metric value', { time_frame: 'all', data_source: 'database' }, 1 let(:expected_value) { 1 }
let(:expected_query) { 'SELECT COUNT("issues"."id") FROM "issues"' }
it_behaves_like 'a correct instrumented metric value and query', { time_frame: 'all' }
end end
...@@ -8,10 +8,18 @@ RSpec.describe Gitlab::Usage::Metrics::Instrumentations::CountUsersCreatingIssue ...@@ -8,10 +8,18 @@ RSpec.describe Gitlab::Usage::Metrics::Instrumentations::CountUsersCreatingIssue
let_it_be(:old_issue) { create(:issue, author: author, created_at: 2.months.ago) } let_it_be(:old_issue) { create(:issue, author: author, created_at: 2.months.ago) }
context 'with all time frame' do context 'with all time frame' do
it_behaves_like 'a correct instrumented metric value', { time_frame: 'all', data_source: 'database' }, 1 let(:expected_value) { 1 }
let(:expected_query) { 'SELECT COUNT(DISTINCT "issues"."author_id") FROM "issues"' }
it_behaves_like 'a correct instrumented metric value and query', { time_frame: 'all' }
end end
context 'for 28d time frame' do context 'for 28d time frame' do
it_behaves_like 'a correct instrumented metric value', { time_frame: '28d', data_source: 'database' }, 1 let(:expected_value) { 1 }
let(:start) { 30.days.ago.to_s(:db) }
let(:finish) { 2.days.ago.to_s(:db) }
let(:expected_query) { "SELECT COUNT(DISTINCT \"issues\".\"author_id\") FROM \"issues\" WHERE \"issues\".\"created_at\" BETWEEN '#{start}' AND '#{finish}'" }
it_behaves_like 'a correct instrumented metric value and query', { time_frame: '28d' }
end end
end end
...@@ -3,5 +3,7 @@ ...@@ -3,5 +3,7 @@
require 'spec_helper' require 'spec_helper'
RSpec.describe Gitlab::Usage::Metrics::Instrumentations::HostnameMetric do RSpec.describe Gitlab::Usage::Metrics::Instrumentations::HostnameMetric do
it_behaves_like 'a correct instrumented metric value', { time_frame: 'none', data_source: 'ruby' }, Gitlab.config.gitlab.host let(:expected_value) { Gitlab.config.gitlab.host }
it_behaves_like 'a correct instrumented metric value', { time_frame: 'none' }
end end
...@@ -10,10 +10,19 @@ RSpec.describe Gitlab::Usage::Metrics::Instrumentations::RedisHLLMetric, :clean_ ...@@ -10,10 +10,19 @@ RSpec.describe Gitlab::Usage::Metrics::Instrumentations::RedisHLLMetric, :clean_
Gitlab::UsageDataCounters::HLLRedisCounter.track_event(:i_quickactions_approve, values: 2, time: 2.months.ago) Gitlab::UsageDataCounters::HLLRedisCounter.track_event(:i_quickactions_approve, values: 2, time: 2.months.ago)
end end
it_behaves_like 'a correct instrumented metric value', { time_frame: '28d', options: { events: ['i_quickactions_approve'] } }, 2 context 'for 28d' do
it_behaves_like 'a correct instrumented metric value', { time_frame: '7d', options: { events: ['i_quickactions_approve'] } }, 1 let(:expected_value) { 2 }
it 'raise exception if vents options is not present' do it_behaves_like 'a correct instrumented metric value', { time_frame: '28d', options: { events: ['i_quickactions_approve'] } }
end
context 'for 7d' do
let(:expected_value) { 1 }
it_behaves_like 'a correct instrumented metric value', { time_frame: '7d', options: { events: ['i_quickactions_approve'] } }
end
it 'raise exception if events options is not present' do
expect { described_class.new(time_frame: '28d') }.to raise_error(ArgumentError) expect { described_class.new(time_frame: '28d') }.to raise_error(ArgumentError)
end end
end end
...@@ -3,5 +3,7 @@ ...@@ -3,5 +3,7 @@
require 'spec_helper' require 'spec_helper'
RSpec.describe Gitlab::Usage::Metrics::Instrumentations::UuidMetric do RSpec.describe Gitlab::Usage::Metrics::Instrumentations::UuidMetric do
it_behaves_like 'a correct instrumented metric value', { time_frame: 'none' }, Gitlab::CurrentSettings.uuid let(:expected_value) { Gitlab::CurrentSettings.uuid }
it_behaves_like 'a correct instrumented metric value', { time_frame: 'none' }
end end
# frozen_string_literal: true
require 'spec_helper'
RSpec.describe Gitlab::Usage::Metrics::Query do
describe '.count' do
it 'returns the raw SQL' do
expect(described_class.for(:count, User)).to eq('SELECT COUNT("users"."id") FROM "users"')
end
it 'does not mix a nil column with keyword arguments' do
expect(described_class.for(:count, User, nil)).to eq('SELECT COUNT("users"."id") FROM "users"')
end
end
describe '.distinct_count' do
it 'returns the raw SQL' do
expect(described_class.for(:distinct_count, Issue, :author_id)).to eq('SELECT COUNT(DISTINCT "issues"."author_id") FROM "issues"')
end
it 'does not mix a nil column with keyword arguments' do
expect(described_class.for(:distinct_count, Issue, nil)).to eq('SELECT COUNT(DISTINCT "issues"."id") FROM "issues"')
end
end
describe '.sum' do
it 'returns the raw SQL' do
expect(described_class.for(:sum, Issue, :weight)).to eq('SELECT SUM("issues"."weight") FROM "issues"')
end
end
describe 'estimate_batch_distinct_count' do
it 'returns the raw SQL' do
expect(described_class.for(:estimate_batch_distinct_count, Issue, :author_id)).to eq('SELECT COUNT(DISTINCT "issues"."author_id") FROM "issues"')
end
end
describe '.histogram' do
it 'returns the histogram sql' do
expect(described_class.for(:histogram, AlertManagement::HttpIntegration.active,
:project_id, buckets: 1..2, bucket_size: 101))
.to match(/^WITH "count_cte" AS #{Gitlab::Database::AsWithMaterialized.materialized_if_supported}/)
end
end
describe 'other' do
it 'raise ArgumentError error' do
expect { described_class.for(:other, nil) }.to raise_error(ArgumentError, 'other operation not supported')
end
end
end
...@@ -13,9 +13,7 @@ RSpec.describe Gitlab::UsageDataQueries do ...@@ -13,9 +13,7 @@ RSpec.describe Gitlab::UsageDataQueries do
end end
it 'does not mix a nil column with keyword arguments' do it 'does not mix a nil column with keyword arguments' do
expect(described_class).to receive(:raw_sql).with(User, nil) expect(described_class.count(User, nil)).to eq('SELECT COUNT("users"."id") FROM "users"')
described_class.count(User, start: 1, finish: 2)
end end
end end
...@@ -25,9 +23,7 @@ RSpec.describe Gitlab::UsageDataQueries do ...@@ -25,9 +23,7 @@ RSpec.describe Gitlab::UsageDataQueries do
end end
it 'does not mix a nil column with keyword arguments' do it 'does not mix a nil column with keyword arguments' do
expect(described_class).to receive(:raw_sql).with(Issue, nil, :distinct) expect(described_class.distinct_count(Issue, nil, start: 1, finish: 2)).to eq('SELECT COUNT(DISTINCT "issues"."id") FROM "issues"')
described_class.distinct_count(Issue, nil, start: 1, finish: 2)
end end
end end
......
# frozen_string_literal: true # frozen_string_literal: true
RSpec.shared_examples 'a correct instrumented metric value' do |params, expected_value| RSpec.shared_examples 'a correct instrumented metric value' do |params|
let(:time_frame) { params[:time_frame] } let(:time_frame) { params[:time_frame] }
let(:options) { params[:options] } let(:options) { params[:options] }
let(:metric) { described_class.new(time_frame: time_frame, options: options) }
before do before do
allow(ActiveRecord::Base.connection).to receive(:transaction_open?).and_return(false) allow(ActiveRecord::Base.connection).to receive(:transaction_open?).and_return(false)
end end
it 'has correct value' do it 'has correct value' do
expect(described_class.new(time_frame: time_frame, options: options).value).to eq(expected_value) expect(metric.value).to eq(expected_value)
end end
end end
RSpec.shared_examples 'a correct instrumented metric query' do |params|
let(:time_frame) { params[:time_frame] }
let(:options) { params[:options] }
let(:metric) { described_class.new(time_frame: time_frame, options: options) }
around do |example|
freeze_time { example.run }
end
before do
allow(ActiveRecord::Base.connection).to receive(:transaction_open?).and_return(false)
end
it 'has correct generate query' do
expect(metric.to_sql).to eq(expected_query)
end
end
RSpec.shared_examples 'a correct instrumented metric value and query' do |params|
it_behaves_like 'a correct instrumented metric value', params
it_behaves_like 'a correct instrumented metric query', params
end
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment