debian-mirror-gitlab/app/services/ci/destroy_expired_job_artifacts_service.rb

90 lines
2.8 KiB
Ruby
Raw Normal View History

2019-03-02 22:35:43 +05:30
# frozen_string_literal: true
module Ci
  # Destroys expired, unlocked CI job artifacts in batches.
  #
  # For every batch the artifacts are bulk-imported into `Ci::DeletedObject`
  # and deleted from `Ci::JobArtifact` inside a single transaction; project
  # statistics and a monitoring counter are updated afterwards. The whole run
  # is wrapped in an exclusive lease (see `#execute`).
  class DestroyExpiredJobArtifactsService
    include ::Gitlab::ExclusiveLeaseHelpers
    include ::Gitlab::LoopHelpers
    include ::Gitlab::Utils::StrongMemoize

    # Number of artifacts loaded and destroyed per batch.
    BATCH_SIZE = 100
    # No further batch is started once this much time has passed since the
    # run began.
    LOOP_TIMEOUT = 5.minutes
    # No further batch is started once the batch index reaches this value.
    LOOP_LIMIT = 1000
    EXCLUSIVE_LOCK_KEY = 'expired_job_artifacts:destroy:lock'
    # TTL handed to `in_lock` for the exclusive lease.
    LOCK_TIMEOUT = 6.minutes

    def initialize
      @removed_artifacts_count = 0
    end

    ##
    # Destroy expired job artifacts on GitLab instance
    #
    # This destroy process cannot run for more than 6 minutes. This prevents
    # multiple `ExpireBuildArtifactsWorker` CRON jobs, which are scheduled
    # every 7 minutes, from running concurrently.
    #
    # Returns the number of artifacts removed by this service instance.
    def execute
      in_lock(EXCLUSIVE_LOCK_KEY, ttl: LOCK_TIMEOUT, retries: 1) do
        destroy_job_artifacts_with_slow_iteration(Time.current)
      end

      @removed_artifacts_count
    end

    private

    # Walks artifacts that expired before `start_at`, ordered by `expire_at`
    # descending, in batches of BATCH_SIZE, and destroys the unlocked ones.
    #
    # `start_at` doubles as the expiry cut-off and as the reference point for
    # the loop timeout. Both stop conditions are evaluated after a batch has
    # been processed, so at least one batch is always attempted.
    def destroy_job_artifacts_with_slow_iteration(start_at)
      Ci::JobArtifact.expired_before(start_at).each_batch(of: BATCH_SIZE, column: :expire_at, order: :desc) do |relation, index|
        # Load the records up front: they are still needed after the rows
        # have been deleted (statistics, counters).
        artifacts = relation.unlocked.with_destroy_preloads.to_a

        parallel_destroy_batch(artifacts) if artifacts.any?
        break if loop_timeout?(start_at)
        break if index >= LOOP_LIMIT
      end
    end

    # Destroys one batch of already-loaded artifacts and updates the
    # bookkeeping for it.
    def parallel_destroy_batch(job_artifacts)
      Ci::DeletedObject.transaction do
        Ci::DeletedObject.bulk_import(job_artifacts)
        Ci::JobArtifact.id_in(job_artifacts.map(&:id)).delete_all
        destroy_related_records_for(job_artifacts)
      end

      # This is executed outside of the transaction because it depends on Redis
      update_project_statistics_for(job_artifacts)
      increment_monitoring_statistics(job_artifacts.size)
    end

    # This method is implemented in EE and it must do only database work
    # (it is called from inside the transaction in `parallel_destroy_batch`).
    def destroy_related_records_for(job_artifacts); end

    # Decrements each project's artifact statistic by the summed size of the
    # artifacts that were just destroyed for that project.
    def update_project_statistics_for(job_artifacts)
      artifacts_by_project = job_artifacts.group_by(&:project)

      artifacts_by_project.each do |project, artifacts|
        # `to_i` lets an artifact without a size count as 0.
        delta = -artifacts.sum { |artifact| artifact.size.to_i }

        ProjectStatistics.increment_statistic(
          project, Ci::JobArtifact.project_statistics_name, delta)
      end
    end

    # Adds `size` to both the metrics counter and the total returned by
    # `#execute`.
    def increment_monitoring_statistics(size)
      destroyed_artifacts_counter.increment({}, size)
      @removed_artifacts_count += size
    end

    # Memoized metrics counter for destroyed artifacts.
    def destroyed_artifacts_counter
      strong_memoize(:destroyed_artifacts_counter) do
        name = :destroyed_job_artifacts_count_total
        comment = 'Counter of destroyed expired job artifacts'

        ::Gitlab::Metrics.counter(name, comment)
      end
    end

    # True once more than LOOP_TIMEOUT has elapsed since `start_at`.
    def loop_timeout?(start_at)
      Time.current > start_at + LOOP_TIMEOUT
    end
  end
end
2021-01-03 14:25:43 +05:30
# Passes the name of the EE counterpart module to `prepend_if_ee` so the
# Enterprise Edition can extend this service (the class notes that
# `destroy_related_records_for` is implemented in EE).
# NOTE(review): `prepend_if_ee` is defined outside this file; presumably it
# does nothing when the EE module is unavailable — confirm.
Ci::DestroyExpiredJobArtifactsService.prepend_if_ee('EE::Ci::DestroyExpiredJobArtifactsService')