debian-mirror-gitlab/app/models/project_statistics.rb

154 lines
5.1 KiB
Ruby
Raw Normal View History

2018-11-18 11:00:15 +05:30
# frozen_string_literal: true
2019-07-07 11:18:12 +05:30
class ProjectStatistics < ApplicationRecord
2019-09-30 21:07:59 +05:30
include AfterCommitQueue
include CounterAttribute

belongs_to :project
belongs_to :namespace

# `default_value_for` only affects newly built records; rows that already
# hold NULL are covered by the `wiki_size` / `snippets_size` reader overrides.
default_value_for :wiki_size, 0
default_value_for :snippets_size, 0

# Columns registered as counter attributes. `increment_statistic` bumps them
# through `delayed_increment_counter` when the counter is enabled for the key.
counter_attribute :build_artifacts_size
counter_attribute :storage_size

# Hook registered via `counter_attribute_after_flush`: enqueues the namespace
# aggregation worker for the namespace of the flushed statistics record.
counter_attribute_after_flush do |project_statistic|
  Namespaces::ScheduleAggregationWorker.perform_async(project_statistic.namespace_id)
end

# Keep the `storage_size` summary column in sync whenever the record is saved.
before_save :update_storage_size
2020-07-28 23:09:34 +05:30
# Statistics recalculated by `refresh!`. Each entry is dispatched to the
# matching `update_<column>` method.
COLUMNS_TO_REFRESH = %i[repository_size wiki_size lfs_objects_size commit_count snippets_size].freeze

# Statistics accepted by `increment_statistic`, mapped to the additional
# summary columns that are incremented by the same amount.
INCREMENTABLE_COLUMNS = {
  build_artifacts_size: %i[storage_size],
  packages_size: %i[storage_size],
  pipeline_artifacts_size: %i[storage_size],
  snippets_size: %i[storage_size]
}.freeze

# Refreshing any of these columns also schedules a namespace aggregation.
NAMESPACE_RELATABLE_COLUMNS = %i[repository_size wiki_size lfs_objects_size].freeze
2017-08-17 22:00:37 +05:30
2019-09-04 21:01:54 +05:30
# Restricts the relation to statistics rows whose project_id is in `project_ids`.
scope :for_project_ids, ->(project_ids) { where(project_id: project_ids) }

# Restricts the relation to statistics rows belonging to `namespaces`.
scope :for_namespaces, ->(namespaces) { where(namespace: namespaces) }
2017-08-17 22:00:37 +05:30
# Sum of `repository_size` and `lfs_objects_size`.
def total_repository_size
  git_size = repository_size
  lfs_size = lfs_objects_size

  git_size + lfs_size
end
2019-09-30 21:07:59 +05:30
# Recalculates statistics via their `update_<column>` methods and saves the
# record.
#
# only - Array of column names (Symbols listed in COLUMNS_TO_REFRESH) to
#        recalculate. An empty Array (the default) recalculates all of them.
#
# Returns nil without doing anything when the database is read-only;
# otherwise returns the result of `save!` (and raises whatever it raises).
def refresh!(only: [])
  return if Gitlab::Database.read_only?

  refresh_all = only.empty?

  COLUMNS_TO_REFRESH.each do |column|
    next unless refresh_all || only.include?(column)

    public_send("update_#{column}") # rubocop:disable GitlabSecurity/PublicSend
  end

  # Namespace-level aggregates only depend on a subset of the columns, so a
  # partial refresh schedules the aggregation only when it touched one of them.
  if refresh_all || only.any? { |column| NAMESPACE_RELATABLE_COLUMNS.include?(column) }
    schedule_namespace_aggregation_worker
  end

  save!
end
# Assigns the repository's commit count to `commit_count`; does not save.
def update_commit_count
  repository = project.repository
  self.commit_count = repository.commit_count
end
# Assigns `repository_size` as the repository's reported size multiplied by
# `1.megabyte`; does not save.
# NOTE(review): presumably `repository.size` is expressed in megabytes and the
# column in bytes — confirm against the repository API.
def update_repository_size
  reported_size = project.repository.size
  self.repository_size = reported_size * 1.megabyte
end
2019-09-04 21:01:54 +05:30
# Assigns `wiki_size` as the wiki repository's reported size multiplied by
# `1.megabyte`; does not save.
def update_wiki_size
  wiki_repository = project.wiki.repository
  self.wiki_size = wiki_repository.size * 1.megabyte
end
2020-07-28 23:09:34 +05:30
# Assigns `snippets_size` as the summed `repository_size` of the project's
# snippets that have statistics; does not save.
def update_snippets_size
  snippets_with_statistics = project.snippets.with_statistics
  self.snippets_size = snippets_with_statistics.sum(:repository_size)
end
2017-08-17 22:00:37 +05:30
# Assigns `lfs_objects_size` as the summed `size` of the project's LFS
# objects; does not save.
def update_lfs_objects_size
  lfs_objects = project.lfs_objects
  self.lfs_objects_size = lfs_objects.sum(:size)
end
2020-07-28 23:09:34 +05:30
# `wiki_size` and `snippets_size` have no default value in the database,
# so both columns can be nil.
# When the columns were added, every existing row was left with nil
# in them.
# Reading either attribute on such a row would therefore return nil instead
# of 0, because `default_value_for` only applies to new records, not existing ones.
#
# These two methods provide consistency and avoid returning nil.
def wiki_size
  # The stored value may be nil for pre-existing rows; `nil.to_i` is 0.
  stored_value = super
  stored_value.to_i
end
def snippets_size
  # The stored value may be nil for pre-existing rows; `nil.to_i` is 0.
  super.to_i
end
2018-10-15 14:42:47 +05:30
# Recomputes `storage_size` as the sum of the individual size statistics and
# assigns it to the record (it is registered as a `before_save` callback).
# Returns the assigned total.
def update_storage_size
  # Named `total` so it does not shadow the `storage_size` attribute reader.
  total = repository_size + wiki_size + lfs_objects_size + build_artifacts_size + packages_size

  # The `snippets_size` column was added on 20200622095419 but db/post_migrate/20190527194900_schedule_calculate_wiki_sizes.rb
  # might try to update project statistics before the `snippets_size` column has been created.
  total += snippets_size if self.class.column_names.include?('snippets_size')

  # The `pipeline_artifacts_size` column was added on 20200817142800 but db/post_migrate/20190527194900_schedule_calculate_wiki_sizes.rb
  # might try to update project statistics before the `pipeline_artifacts_size` column has been created.
  total += pipeline_artifacts_size if self.class.column_names.include?('pipeline_artifacts_size')

  self.storage_size = total
end
2018-11-18 11:00:15 +05:30
# Since this incremental update method does not call update_storage_size above,
# we have to update storage_size here as an additional column.
# Additional columns are looked up in INCREMENTABLE_COLUMNS (key => [columns]),
# which lets us increment statistics whether or not they are included in
# storage_size, or in any other summary column added in the future.
2021-01-03 14:25:43 +05:30
# Adds `amount` to the `key` statistic of `project`, and to every additional
# column listed for `key` in INCREMENTABLE_COLUMNS.
#
# project - object responding to `statistics` (and, on the legacy path,
#           to `id` and `namespace_id`)
# key     - Symbol; must be a key of INCREMENTABLE_COLUMNS
# amount  - value to add; 0 is a no-op
#
# Raises ArgumentError when `key` is not incrementable.
# Does nothing when the project has no statistics record.
def self.increment_statistic(project, key, amount)
  raise ArgumentError, "Cannot increment attribute: #{key}" unless INCREMENTABLE_COLUMNS.key?(key)
  return if amount == 0

  project_statistics = project.statistics
  return unless project_statistics

  unless project_statistics.counter_attribute_enabled?(key)
    return legacy_increment_statistic(project, key, amount)
  end

  [key, *INCREMENTABLE_COLUMNS[key]].each do |statistic|
    project_statistics.delayed_increment_counter(statistic, amount)
  end
end
# Fallback used by `increment_statistic` when the counter attribute is not
# enabled for `key`: applies the increment through `columns_to_increment` on
# the rows matching the project's id, then enqueues the namespace aggregation
# worker for the project's namespace.
#
# Returns the result of `perform_async`.
def self.legacy_increment_statistic(project, key, amount)
  where(project_id: project.id).columns_to_increment(key, amount)

  Namespaces::ScheduleAggregationWorker.perform_async( # rubocop: disable CodeReuse/Worker
    project.namespace_id)
end
# Issues one `update_all` that adds `amount` to `key` and to every additional
# column listed for `key` in INCREMENTABLE_COLUMNS. NULL column values are
# treated as 0 via COALESCE.
#
# NOTE(review): `key` and `amount` are interpolated into the SQL fragment
# verbatim. `increment_statistic` validates `key`, but this method is public;
# callers must only pass trusted column names and numeric amounts.
#
# Returns the result of `update_all`.
def self.columns_to_increment(key, amount)
  columns = [key, *INCREMENTABLE_COLUMNS[key]]
  assignments = columns.map { |column| "#{column} = COALESCE(#{column}, 0) + (#{amount})" }

  update_all(assignments.join(', '))
end
2019-09-30 21:07:59 +05:30
private
# Hands a block to `run_after_commit` that enqueues the namespace aggregation
# worker for the project's namespace. The namespace id is read when the block
# runs, not when it is registered.
def schedule_namespace_aggregation_worker
  run_after_commit { Namespaces::ScheduleAggregationWorker.perform_async(project.namespace_id) }
end
2017-08-17 22:00:37 +05:30
end
2019-12-04 20:38:33 +05:30
# Passes the 'EE::ProjectStatistics' module name to `prepend_if_ee`.
# NOTE(review): presumably this prepends the module only when Enterprise
# Edition code is available — confirm against the helper's definition.
ProjectStatistics.prepend_if_ee('EE::ProjectStatistics')