2019-02-15 15:39:39 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Ci
|
|
|
|
class ArchiveTraceService
|
2019-10-12 21:52:04 +05:30
|
|
|
def execute(job, worker_name:)
|
2021-11-18 22:05:49 +05:30
|
|
|
unless job.trace.archival_attempts_available?
|
|
|
|
Sidekiq.logger.warn(class: worker_name, message: 'The job is out of archival attempts.', job_id: job.id)
|
|
|
|
|
|
|
|
job.trace.attempt_archive_cleanup!
|
|
|
|
return
|
|
|
|
end
|
|
|
|
|
2021-11-11 11:23:49 +05:30
|
|
|
unless job.trace.can_attempt_archival_now?
|
2021-11-18 22:05:49 +05:30
|
|
|
Sidekiq.logger.warn(class: worker_name, message: 'The job can not be archived right now.', job_id: job.id)
|
2021-11-11 11:23:49 +05:30
|
|
|
return
|
|
|
|
end
|
|
|
|
|
2019-10-12 21:52:04 +05:30
|
|
|
# TODO: Remove this logging once we confirmed new live trace architecture is functional.
|
|
|
|
# See https://gitlab.com/gitlab-com/gl-infra/infrastructure/issues/4667.
|
|
|
|
unless job.has_live_trace?
|
|
|
|
Sidekiq.logger.warn(class: worker_name,
|
|
|
|
message: 'The job does not have live trace but going to be archived.',
|
|
|
|
job_id: job.id)
|
|
|
|
return
|
|
|
|
end
|
|
|
|
|
2019-02-15 15:39:39 +05:30
|
|
|
job.trace.archive!
|
2020-11-24 15:15:51 +05:30
|
|
|
job.remove_pending_state!
|
2019-10-12 21:52:04 +05:30
|
|
|
|
|
|
|
# TODO: Remove this logging once we confirmed new live trace architecture is functional.
|
|
|
|
# See https://gitlab.com/gitlab-com/gl-infra/infrastructure/issues/4667.
|
|
|
|
unless job.has_archived_trace?
|
|
|
|
Sidekiq.logger.warn(class: worker_name,
|
|
|
|
message: 'The job does not have archived trace after archiving.',
|
|
|
|
job_id: job.id)
|
|
|
|
end
|
2019-02-15 15:39:39 +05:30
|
|
|
rescue ::Gitlab::Ci::Trace::AlreadyArchivedError
|
|
|
|
# It's already archived, thus we can safely ignore this exception.
|
2021-06-08 01:23:25 +05:30
|
|
|
rescue StandardError => e
|
2021-11-11 11:23:49 +05:30
|
|
|
job.trace.increment_archival_attempts!
|
|
|
|
|
2019-02-15 15:39:39 +05:30
|
|
|
# Tracks this error with application logs, Sentry, and Prometheus.
|
|
|
|
# If `archive!` keeps failing for over a week, that could incur data loss.
|
2021-01-03 14:25:43 +05:30
|
|
|
# (See more https://docs.gitlab.com/ee/administration/job_logs.html#new-incremental-logging-architecture)
|
2019-02-15 15:39:39 +05:30
|
|
|
# In order to avoid interrupting the system, we do not raise an exception here.
|
2019-10-12 21:52:04 +05:30
|
|
|
archive_error(e, job, worker_name)
|
2019-02-15 15:39:39 +05:30
|
|
|
end
|
|
|
|
|
|
|
|
private
|
|
|
|
|
|
|
|
def failed_archive_counter
|
|
|
|
@failed_archive_counter ||=
|
|
|
|
Gitlab::Metrics.counter(:job_trace_archive_failed_total,
|
|
|
|
"Counter of failed attempts of trace archiving")
|
|
|
|
end
|
|
|
|
|
2019-10-12 21:52:04 +05:30
|
|
|
def archive_error(error, job, worker_name)
|
2019-02-15 15:39:39 +05:30
|
|
|
failed_archive_counter.increment
|
2019-10-12 21:52:04 +05:30
|
|
|
|
|
|
|
Sidekiq.logger.warn(class: worker_name,
|
|
|
|
message: "Failed to archive trace. message: #{error.message}.",
|
|
|
|
job_id: job.id)
|
2019-02-15 15:39:39 +05:30
|
|
|
|
2020-01-01 13:55:28 +05:30
|
|
|
Gitlab::ErrorTracking
|
|
|
|
.track_and_raise_for_dev_exception(error,
|
2019-12-04 20:38:33 +05:30
|
|
|
issue_url: 'https://gitlab.com/gitlab-org/gitlab-foss/issues/51502',
|
2020-01-01 13:55:28 +05:30
|
|
|
job_id: job.id )
|
2019-02-15 15:39:39 +05:30
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|