2018-03-17 18:26:18 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
|
|
|
module Gitlab
|
|
|
|
module GithubImport
|
|
|
|
# AdvanceStageWorker is a worker used by the GitHub importer to wait for a
|
|
|
|
# number of jobs to complete, without blocking a thread. Once all jobs have
|
|
|
|
# been completed this worker will advance the import process to the next
|
|
|
|
# stage.
|
|
|
|
class AdvanceStageWorker
|
|
|
|
include ApplicationWorker
|
|
|
|
|
|
|
|
sidekiq_options dead: false
|
|
|
|
|
|
|
|
INTERVAL = 30.seconds.to_i
|
|
|
|
|
|
|
|
# The number of seconds to wait (while blocking the thread) before
|
2018-12-13 13:39:08 +05:30
|
|
|
# continuing to the next waiter.
|
2018-03-17 18:26:18 +05:30
|
|
|
BLOCKING_WAIT_TIME = 5
|
|
|
|
|
|
|
|
# The known importer stages and their corresponding Sidekiq workers.
|
|
|
|
STAGES = {
|
|
|
|
issues_and_diff_notes: Stage::ImportIssuesAndDiffNotesWorker,
|
|
|
|
notes: Stage::ImportNotesWorker,
|
2018-11-08 19:23:39 +05:30
|
|
|
lfs_objects: Stage::ImportLfsObjectsWorker,
|
2018-03-17 18:26:18 +05:30
|
|
|
finish: Stage::FinishImportWorker
|
|
|
|
}.freeze
|
|
|
|
|
|
|
|
# project_id - The ID of the project being imported.
|
|
|
|
# waiters - A Hash mapping Gitlab::JobWaiter keys to the number of
|
|
|
|
# remaining jobs.
|
|
|
|
# next_stage - The name of the next stage to start when all jobs have been
|
|
|
|
# completed.
|
|
|
|
def perform(project_id, waiters, next_stage)
|
|
|
|
return unless (project = find_project(project_id))
|
|
|
|
|
|
|
|
new_waiters = wait_for_jobs(waiters)
|
|
|
|
|
|
|
|
if new_waiters.empty?
|
|
|
|
# We refresh the import JID here so workers importing individual
|
|
|
|
# resources (e.g. notes) don't have to do this all the time, reducing
|
|
|
|
# the pressure on Redis. We _only_ do this once all jobs are done so
|
|
|
|
# we don't get stuck forever if one or more jobs failed to notify the
|
|
|
|
# JobWaiter.
|
|
|
|
project.refresh_import_jid_expiration
|
|
|
|
|
|
|
|
STAGES.fetch(next_stage.to_sym).perform_async(project_id)
|
|
|
|
else
|
|
|
|
self.class.perform_in(INTERVAL, project_id, new_waiters, next_stage)
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
def wait_for_jobs(waiters)
|
|
|
|
waiters.each_with_object({}) do |(key, remaining), new_waiters|
|
|
|
|
waiter = JobWaiter.new(remaining, key)
|
|
|
|
|
|
|
|
# We wait for a brief moment of time so we don't reschedule if we can
|
|
|
|
# complete the work fast enough.
|
|
|
|
waiter.wait(BLOCKING_WAIT_TIME)
|
|
|
|
|
|
|
|
next unless waiter.jobs_remaining.positive?
|
|
|
|
|
|
|
|
new_waiters[waiter.key] = waiter.jobs_remaining
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
2018-12-05 23:21:45 +05:30
|
|
|
# rubocop: disable CodeReuse/ActiveRecord
|
2018-03-17 18:26:18 +05:30
|
|
|
def find_project(id)
|
2018-10-15 14:42:47 +05:30
|
|
|
# TODO: Only select the JID
|
|
|
|
# This is due to the fact that the JID could be present in either the project record or
|
|
|
|
# its associated import_state record
|
|
|
|
Project.import_started.find_by(id: id)
|
2018-03-17 18:26:18 +05:30
|
|
|
end
|
2018-12-05 23:21:45 +05:30
|
|
|
# rubocop: enable CodeReuse/ActiveRecord
|
2018-03-17 18:26:18 +05:30
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|