98 lines
3.1 KiB
Ruby
98 lines
3.1 KiB
Ruby
# frozen_string_literal: true
|
|
|
|
# This module is used in:
|
|
# - SingleEndpointDiffNotesImporter
|
|
# - SingleEndpointIssueNotesImporter
|
|
# - SingleEndpointMergeRequestNotesImporter
|
|
# if `github_importer_single_endpoint_notes_import` feature flag is on.
|
|
#
|
|
# - SingleEndpointIssueEventsImporter
|
|
# if `github_importer_issue_events_import` feature flag is on.
|
|
#
|
|
# Fetches associated objects page by page to each item of parent collection.
|
|
# Currently `associated` is note or event.
|
|
# Currently `parent` is MergeRequest or Issue record.
|
|
#
|
|
# It fetches 1 PR's associated objects at a time using `issue_comments` or
|
|
# `pull_request_comments` endpoint, which is slower than `NotesImporter`
|
|
# but it makes sure all notes are imported, as it can sometimes not be
|
|
# the case for `NotesImporter`, because `issues_comments` endpoint
|
|
# it uses can be limited by GitHub API to not return all available pages.
|
|
module Gitlab
|
|
module GithubImport
|
|
module SingleEndpointNotesImporting
|
|
BATCH_SIZE = 100
|
|
|
|
def each_object_to_import(&block)
|
|
each_associated_page do |parent_record, associated_page|
|
|
associated_page.objects.each do |associated|
|
|
each_associated(parent_record, associated, &block)
|
|
end
|
|
end
|
|
end
|
|
|
|
def id_for_already_imported_cache(associated)
|
|
associated.id
|
|
end
|
|
|
|
def parent_collection
|
|
raise NotImplementedError
|
|
end
|
|
|
|
def parent_imported_cache_key
|
|
raise NotImplementedError
|
|
end
|
|
|
|
def page_counter_id(parent)
|
|
raise NotImplementedError
|
|
end
|
|
|
|
private
|
|
|
|
# Sometimes we need to add some extra info from parent
|
|
# to associated record that is not available by default
|
|
# in Github API response object. For example:
|
|
# lib/gitlab/github_import/importer/single_endpoint_issue_events_importer.rb:26
|
|
def each_associated(_parent_record, associated)
|
|
return if already_imported?(associated)
|
|
|
|
Gitlab::GithubImport::ObjectCounter.increment(project, object_type, :fetched)
|
|
|
|
yield(associated)
|
|
|
|
mark_as_imported(associated)
|
|
end
|
|
|
|
def each_associated_page
|
|
parent_collection.each_batch(of: BATCH_SIZE, column: :iid) do |batch|
|
|
batch.each do |parent_record|
|
|
# The page counter needs to be scoped by parent_record to avoid skipping
|
|
# pages of notes from already imported parent_record.
|
|
page_counter = PageCounter.new(project, page_counter_id(parent_record))
|
|
repo = project.import_source
|
|
options = collection_options.merge(page: page_counter.current)
|
|
|
|
client.each_page(collection_method, repo, parent_record.iid, options) do |page|
|
|
next unless page_counter.set(page.number)
|
|
|
|
yield parent_record, page
|
|
end
|
|
|
|
mark_parent_imported(parent_record)
|
|
end
|
|
end
|
|
end
|
|
|
|
def mark_parent_imported(parent)
|
|
Gitlab::Cache::Import::Caching.set_add(
|
|
parent_imported_cache_key,
|
|
parent.iid
|
|
)
|
|
end
|
|
|
|
def already_imported_parents
|
|
Gitlab::Cache::Import::Caching.values_from_set(parent_imported_cache_key)
|
|
end
|
|
end
|
|
end
|
|
end
|