Commit e51d2609 authored by Piotr Skorupa's avatar Piotr Skorupa

Add TimeFrame module for metric time periods SSOT

parent 1a6bb212
This diff is collapsed.
...@@ -22,9 +22,7 @@ module Gitlab ...@@ -22,9 +22,7 @@ module Gitlab
}.freeze }.freeze
class Aggregate class Aggregate
delegate :weekly_time_range, include Gitlab::Usage::TimeFrame
:monthly_time_range,
to: Gitlab::Utils::UsageData
def initialize(recorded_at) def initialize(recorded_at)
@aggregated_metrics = load_metrics(AGGREGATED_METRICS_PATH) @aggregated_metrics = load_metrics(AGGREGATED_METRICS_PATH)
...@@ -32,15 +30,15 @@ module Gitlab ...@@ -32,15 +30,15 @@ module Gitlab
end end
def all_time_data def all_time_data
aggregated_metrics_data(start_date: nil, end_date: nil, time_frame: Gitlab::Utils::UsageData::ALL_TIME_TIME_FRAME_NAME) aggregated_metrics_data(start_date: nil, end_date: nil, time_frame: Gitlab::Usage::TimeFrame::ALL_TIME_TIME_FRAME_NAME)
end end
def monthly_data def monthly_data
aggregated_metrics_data(**monthly_time_range.merge(time_frame: Gitlab::Utils::UsageData::TWENTY_EIGHT_DAYS_TIME_FRAME_NAME)) aggregated_metrics_data(**monthly_time_range.merge(time_frame: Gitlab::Usage::TimeFrame::TWENTY_EIGHT_DAYS_TIME_FRAME_NAME))
end end
def weekly_data def weekly_data
aggregated_metrics_data(**weekly_time_range.merge(time_frame: Gitlab::Utils::UsageData::SEVEN_DAYS_TIME_FRAME_NAME)) aggregated_metrics_data(**weekly_time_range.merge(time_frame: Gitlab::Usage::TimeFrame::SEVEN_DAYS_TIME_FRAME_NAME))
end end
private private
...@@ -54,7 +52,7 @@ module Gitlab ...@@ -54,7 +52,7 @@ module Gitlab
case aggregation[:source] case aggregation[:source]
when REDIS_SOURCE when REDIS_SOURCE
if time_frame == Gitlab::Utils::UsageData::ALL_TIME_TIME_FRAME_NAME if time_frame == Gitlab::Usage::TimeFrame::ALL_TIME_TIME_FRAME_NAME
data[aggregation[:name]] = Gitlab::Utils::UsageData::FALLBACK data[aggregation[:name]] = Gitlab::Utils::UsageData::FALLBACK
Gitlab::ErrorTracking Gitlab::ErrorTracking
.track_and_raise_for_dev_exception( .track_and_raise_for_dev_exception(
......
...@@ -56,15 +56,15 @@ module Gitlab ...@@ -56,15 +56,15 @@ module Gitlab
end end
def time_period_to_human_name(time_period) def time_period_to_human_name(time_period)
return Gitlab::Utils::UsageData::ALL_TIME_TIME_FRAME_NAME if time_period.blank? return Gitlab::Usage::TimeFrame::ALL_TIME_TIME_FRAME_NAME if time_period.blank?
start_date = time_period.first.to_date start_date = time_period.first.to_date
end_date = time_period.last.to_date end_date = time_period.last.to_date
if (end_date - start_date).to_i > 7 if (end_date - start_date).to_i > 7
Gitlab::Utils::UsageData::TWENTY_EIGHT_DAYS_TIME_FRAME_NAME Gitlab::Usage::TimeFrame::TWENTY_EIGHT_DAYS_TIME_FRAME_NAME
else else
Gitlab::Utils::UsageData::SEVEN_DAYS_TIME_FRAME_NAME Gitlab::Usage::TimeFrame::SEVEN_DAYS_TIME_FRAME_NAME
end end
end end
end end
......
...@@ -6,6 +6,7 @@ module Gitlab ...@@ -6,6 +6,7 @@ module Gitlab
module Instrumentations module Instrumentations
class BaseMetric class BaseMetric
include Gitlab::Utils::UsageData include Gitlab::Utils::UsageData
include Gitlab::Usage::TimeFrame
attr_reader :time_frame attr_reader :time_frame
attr_reader :options attr_reader :options
......
...@@ -52,7 +52,7 @@ module Gitlab ...@@ -52,7 +52,7 @@ module Gitlab
def time_constraints def time_constraints
case time_frame case time_frame
when '28d' when '28d'
{ created_at: 30.days.ago..2.days.ago } monthly_time_range_db_params
when 'all' when 'all'
{} {}
when 'none' when 'none'
......
...@@ -35,9 +35,9 @@ module Gitlab ...@@ -35,9 +35,9 @@ module Gitlab
def time_constraints def time_constraints
case time_frame case time_frame
when '28d' when '28d'
{ start_date: 4.weeks.ago.to_date, end_date: Date.current } monthly_time_range
when '7d' when '7d'
{ start_date: 7.days.ago.to_date, end_date: Date.current } weekly_time_range
else else
raise "Unknown time frame: #{time_frame} for RedisHLLMetric" raise "Unknown time frame: #{time_frame} for RedisHLLMetric"
end end
......
# frozen_string_literal: true
module Gitlab
module Usage
module TimeFrame
ALL_TIME_TIME_FRAME_NAME = "all"
SEVEN_DAYS_TIME_FRAME_NAME = "7d"
TWENTY_EIGHT_DAYS_TIME_FRAME_NAME = "28d"
def weekly_time_range
{ start_date: 7.days.ago.to_date, end_date: Date.current }
end
def monthly_time_range
{ start_date: 4.weeks.ago.to_date, end_date: Date.current }
end
# This time range is skewed for batch counter performance.
# See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/42972
def monthly_time_range_db_params(column: :created_at)
{ column => 30.days.ago..2.days.ago }
end
end
end
end
...@@ -33,6 +33,7 @@ module Gitlab ...@@ -33,6 +33,7 @@ module Gitlab
class << self class << self
include Gitlab::Utils::UsageData include Gitlab::Utils::UsageData
include Gitlab::Utils::StrongMemoize include Gitlab::Utils::StrongMemoize
include Gitlab::Usage::TimeFrame
def data(force_refresh: false) def data(force_refresh: false)
Rails.cache.fetch('usage_data', force: force_refresh, expires_in: 2.weeks) do Rails.cache.fetch('usage_data', force: force_refresh, expires_in: 2.weeks) do
...@@ -55,7 +56,7 @@ module Gitlab ...@@ -55,7 +56,7 @@ module Gitlab
.merge(object_store_usage_data) .merge(object_store_usage_data)
.merge(topology_usage_data) .merge(topology_usage_data)
.merge(usage_activity_by_stage) .merge(usage_activity_by_stage)
.merge(usage_activity_by_stage(:usage_activity_by_stage_monthly, last_28_days_time_period)) .merge(usage_activity_by_stage(:usage_activity_by_stage_monthly, monthly_time_range_db_params))
.merge(analytics_unique_visits_data) .merge(analytics_unique_visits_data)
.merge(compliance_unique_visits_data) .merge(compliance_unique_visits_data)
.merge(search_unique_visits_data) .merge(search_unique_visits_data)
...@@ -228,17 +229,17 @@ module Gitlab ...@@ -228,17 +229,17 @@ module Gitlab
{ {
counts_monthly: { counts_monthly: {
# rubocop: disable UsageData/LargeTable: # rubocop: disable UsageData/LargeTable:
deployments: deployment_count(Deployment.where(last_28_days_time_period)), deployments: deployment_count(Deployment.where(monthly_time_range_db_params)),
successful_deployments: deployment_count(Deployment.success.where(last_28_days_time_period)), successful_deployments: deployment_count(Deployment.success.where(monthly_time_range_db_params)),
failed_deployments: deployment_count(Deployment.failed.where(last_28_days_time_period)), failed_deployments: deployment_count(Deployment.failed.where(monthly_time_range_db_params)),
# rubocop: enable UsageData/LargeTable: # rubocop: enable UsageData/LargeTable:
projects: count(Project.where(last_28_days_time_period), start: minimum_id(Project), finish: maximum_id(Project)), projects: count(Project.where(monthly_time_range_db_params), start: minimum_id(Project), finish: maximum_id(Project)),
packages: count(::Packages::Package.where(last_28_days_time_period)), packages: count(::Packages::Package.where(monthly_time_range_db_params)),
personal_snippets: count(PersonalSnippet.where(last_28_days_time_period)), personal_snippets: count(PersonalSnippet.where(monthly_time_range_db_params)),
project_snippets: count(ProjectSnippet.where(last_28_days_time_period)), project_snippets: count(ProjectSnippet.where(monthly_time_range_db_params)),
projects_with_alerts_created: distinct_count(::AlertManagement::Alert.where(last_28_days_time_period), :project_id) projects_with_alerts_created: distinct_count(::AlertManagement::Alert.where(monthly_time_range_db_params), :project_id)
}.merge( }.merge(
snowplow_event_counts(last_28_days_time_period(column: :collector_tstamp)) snowplow_event_counts(monthly_time_range_db_params(column: :collector_tstamp))
).tap do |data| ).tap do |data|
data[:snippets] = add(data[:personal_snippets], data[:project_snippets]) data[:snippets] = add(data[:personal_snippets], data[:project_snippets])
end end
...@@ -522,10 +523,6 @@ module Gitlab ...@@ -522,10 +523,6 @@ module Gitlab
"#{platform}-#{ohai_data['platform_version']}" "#{platform}-#{ohai_data['platform_version']}"
end end
def last_28_days_time_period(column: :created_at)
{ column => batch_counter_monthly_time_range[:start_date]..batch_counter_monthly_time_range[:end_date] }
end
# Source: https://gitlab.com/gitlab-data/analytics/blob/master/transform/snowflake-dbt/data/ping_metrics_to_stage_mapping_data.csv # Source: https://gitlab.com/gitlab-data/analytics/blob/master/transform/snowflake-dbt/data/ping_metrics_to_stage_mapping_data.csv
def usage_activity_by_stage(key = :usage_activity_by_stage, time_period = {}) def usage_activity_by_stage(key = :usage_activity_by_stage, time_period = {})
{ {
......
...@@ -38,6 +38,7 @@ module Gitlab ...@@ -38,6 +38,7 @@ module Gitlab
# * Get unique counts per user: Gitlab::UsageDataCounters::HLLRedisCounter.unique_events(event_names: 'g_compliance_dashboard', start_date: 28.days.ago, end_date: Date.current) # * Get unique counts per user: Gitlab::UsageDataCounters::HLLRedisCounter.unique_events(event_names: 'g_compliance_dashboard', start_date: 28.days.ago, end_date: Date.current)
class << self class << self
include Gitlab::Utils::UsageData include Gitlab::Utils::UsageData
include Gitlab::Usage::TimeFrame
# Track unique events # Track unique events
# #
......
...@@ -42,25 +42,8 @@ module Gitlab ...@@ -42,25 +42,8 @@ module Gitlab
FALLBACK = -1 FALLBACK = -1
HISTOGRAM_FALLBACK = { '-1' => -1 }.freeze HISTOGRAM_FALLBACK = { '-1' => -1 }.freeze
DISTRIBUTED_HLL_FALLBACK = -2 DISTRIBUTED_HLL_FALLBACK = -2
ALL_TIME_TIME_FRAME_NAME = "all"
SEVEN_DAYS_TIME_FRAME_NAME = "7d"
TWENTY_EIGHT_DAYS_TIME_FRAME_NAME = "28d"
MAX_BUCKET_SIZE = 100 MAX_BUCKET_SIZE = 100
def weekly_time_range
{ start_date: 7.days.ago.to_date, end_date: Date.current }
end
def monthly_time_range
{ start_date: 4.weeks.ago.to_date, end_date: Date.current }
end
# This time range is skewed for batch counter performance.
# See https://gitlab.com/gitlab-org/gitlab/-/merge_requests/42972
def batch_counter_monthly_time_range
{ start_date: 30.days.ago.to_date, end_date: 2.days.ago.to_date }
end
def count(relation, column = nil, batch: true, batch_size: nil, start: nil, finish: nil) def count(relation, column = nil, batch: true, batch_size: nil, start: nil, finish: nil)
if batch if batch
Gitlab::Database::BatchCount.batch_count(relation, column, batch_size: batch_size, start: start, finish: finish) Gitlab::Database::BatchCount.batch_count(relation, column, batch_size: batch_size, start: start, finish: finish)
......
...@@ -25,9 +25,9 @@ RSpec.describe 'aggregated metrics' do ...@@ -25,9 +25,9 @@ RSpec.describe 'aggregated metrics' do
RSpec::Matchers.define :have_known_time_frame do RSpec::Matchers.define :have_known_time_frame do
allowed_time_frames = [ allowed_time_frames = [
Gitlab::Utils::UsageData::ALL_TIME_TIME_FRAME_NAME, Gitlab::Usage::TimeFrame::ALL_TIME_TIME_FRAME_NAME,
Gitlab::Utils::UsageData::TWENTY_EIGHT_DAYS_TIME_FRAME_NAME, Gitlab::Usage::TimeFrame::TWENTY_EIGHT_DAYS_TIME_FRAME_NAME,
Gitlab::Utils::UsageData::SEVEN_DAYS_TIME_FRAME_NAME Gitlab::Usage::TimeFrame::SEVEN_DAYS_TIME_FRAME_NAME
] ]
match do |aggregate| match do |aggregate|
...@@ -63,7 +63,7 @@ RSpec.describe 'aggregated metrics' do ...@@ -63,7 +63,7 @@ RSpec.describe 'aggregated metrics' do
let_it_be(:events_records) { known_events.select { |event| aggregate[:events].include?(event[:name]) } } let_it_be(:events_records) { known_events.select { |event| aggregate[:events].include?(event[:name]) } }
it "does not include 'all' time frame for Redis sourced aggregate" do it "does not include 'all' time frame for Redis sourced aggregate" do
expect(aggregate[:time_frame]).not_to include(Gitlab::Utils::UsageData::ALL_TIME_TIME_FRAME_NAME) expect(aggregate[:time_frame]).not_to include(Gitlab::Usage::TimeFrame::ALL_TIME_TIME_FRAME_NAME)
end end
it "only refers to known events" do it "only refers to known events" do
......
...@@ -91,7 +91,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -91,7 +91,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
expect(described_class.usage_activity_by_stage_package({})).to eq( expect(described_class.usage_activity_by_stage_package({})).to eq(
projects_with_packages: 2 projects_with_packages: 2
) )
expect(described_class.usage_activity_by_stage_package(described_class.last_28_days_time_period)).to eq( expect(described_class.usage_activity_by_stage_package(described_class.monthly_time_range_db_params)).to eq(
projects_with_packages: 1 projects_with_packages: 1
) )
end end
...@@ -135,7 +135,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -135,7 +135,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
project_clusters_disabled: 2, project_clusters_disabled: 2,
project_clusters_enabled: 10 project_clusters_enabled: 10
) )
expect(described_class.usage_activity_by_stage_configure(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_configure(described_class.monthly_time_range_db_params)).to include(
clusters_applications_cert_managers: 1, clusters_applications_cert_managers: 1,
clusters_applications_helm: 1, clusters_applications_helm: 1,
clusters_applications_ingress: 1, clusters_applications_ingress: 1,
...@@ -185,7 +185,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -185,7 +185,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
snippets: 2, snippets: 2,
suggestions: 2 suggestions: 2
) )
expect(described_class.usage_activity_by_stage_create(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_create(described_class.monthly_time_range_db_params)).to include(
deploy_keys: 1, deploy_keys: 1,
keys: 1, keys: 1,
merge_requests: 1, merge_requests: 1,
...@@ -225,7 +225,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -225,7 +225,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
omniauth_providers: ['google_oauth2'], omniauth_providers: ['google_oauth2'],
user_auth_by_provider: { 'group_saml' => 2, 'ldap' => 4, 'standard' => 0, 'two-factor' => 0, 'two-factor-via-u2f-device' => 0, "two-factor-via-webauthn-device" => 0 } user_auth_by_provider: { 'group_saml' => 2, 'ldap' => 4, 'standard' => 0, 'two-factor' => 0, 'two-factor-via-u2f-device' => 0, "two-factor-via-webauthn-device" => 0 }
) )
expect(described_class.usage_activity_by_stage_manage(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_manage(described_class.monthly_time_range_db_params)).to include(
events: 1, events: 1,
groups: 1, groups: 1,
users_created: 3, users_created: 3,
...@@ -252,7 +252,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -252,7 +252,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
unique_users_all_imports: 10 unique_users_all_imports: 10
) )
expect(described_class.usage_activity_by_stage_manage(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_manage(described_class.monthly_time_range_db_params)).to include(
unique_users_all_imports: 5 unique_users_all_imports: 5
) )
end end
...@@ -327,7 +327,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -327,7 +327,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
groups_imported: Gitlab::UsageData::DEPRECATED_VALUE groups_imported: Gitlab::UsageData::DEPRECATED_VALUE
} }
) )
expect(described_class.usage_activity_by_stage_manage(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_manage(described_class.monthly_time_range_db_params)).to include(
{ {
bulk_imports: { bulk_imports: {
gitlab_v1: 1, gitlab_v1: 1,
...@@ -411,7 +411,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -411,7 +411,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
projects_with_enabled_alert_integrations_histogram: { '1' => 2 } projects_with_enabled_alert_integrations_histogram: { '1' => 2 }
) )
data_28_days = described_class.usage_activity_by_stage_monitor(described_class.last_28_days_time_period) data_28_days = described_class.usage_activity_by_stage_monitor(described_class.monthly_time_range_db_params)
expect(data_28_days).to include( expect(data_28_days).to include(
clusters: 1, clusters: 1,
clusters_applications_prometheus: 1, clusters_applications_prometheus: 1,
...@@ -450,7 +450,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -450,7 +450,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
projects_jira_dvcs_cloud_active: 2, projects_jira_dvcs_cloud_active: 2,
projects_jira_dvcs_server_active: 2 projects_jira_dvcs_server_active: 2
) )
expect(described_class.usage_activity_by_stage_plan(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_plan(described_class.monthly_time_range_db_params)).to include(
issues: 2, issues: 2,
notes: 1, notes: 1,
projects: 1, projects: 1,
...@@ -479,7 +479,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -479,7 +479,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
releases: 2, releases: 2,
successful_deployments: 2 successful_deployments: 2
) )
expect(described_class.usage_activity_by_stage_release(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_release(described_class.monthly_time_range_db_params)).to include(
deployments: 1, deployments: 1,
failed_deployments: 1, failed_deployments: 1,
releases: 1, releases: 1,
...@@ -513,7 +513,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do ...@@ -513,7 +513,7 @@ RSpec.describe Gitlab::UsageData, :aggregate_failures do
ci_triggers: 2, ci_triggers: 2,
clusters_applications_runner: 2 clusters_applications_runner: 2
) )
expect(described_class.usage_activity_by_stage_verify(described_class.last_28_days_time_period)).to include( expect(described_class.usage_activity_by_stage_verify(described_class.monthly_time_range_db_params)).to include(
ci_builds: 1, ci_builds: 1,
ci_external_pipelines: 1, ci_external_pipelines: 1,
ci_internal_pipelines: 1, ci_internal_pipelines: 1,
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment