# frozen_string_literal: true

class MergeRequestDiffCommit < ApplicationRecord
extend SuppressCompositePrimaryKeyWarning

include BulkInsertSafe
include ShaAttribute
include CachedCommit
include IgnorableColumns
include FromUnion

# These four columns are ignored on this model; the instance methods of the
# same names defined in this class read their values through the
# `commit_author` and `committer` associations instead.
ignore_column %i[author_name author_email committer_name committer_email],
  remove_with: '14.6',
  remove_after: '2021-11-22'

belongs_to :merge_request_diff

# This relation is called `commit_author` and not `author`, as the project
# import/export logic treats relations named `author` as instances of the
# `User` class.
#
# NOTE: these columns are _not_ indexed, nor do they use foreign keys.
#
# This is deliberate, as creating these indexes on GitLab.com takes a _very_
# long time. In addition, there's no real need for them either based on how
# this data is used.
#
# For more information, refer to the following:
#
# - https://gitlab.com/gitlab-com/gl-infra/production/-/issues/5038#note_614592881
# - https://gitlab.com/gitlab-org/gitlab/-/merge_requests/63669
belongs_to :commit_author, class_name: 'MergeRequest::DiffCommitUser'
belongs_to :committer, class_name: 'MergeRequest::DiffCommitUser'

sha_attribute :sha

# `id` is an alias for the `sha` attribute.
alias_attribute :id, :sha

serialize :trailers, Serializers::Json # rubocop:disable Cop/ActiveRecordSerialize

validates :trailers, json_schema: { filename: 'git_trailers' }

# Preloads the `commit_author` and `committer` associations.
scope :with_users, -> { preload(:commit_author, :committer) }

# A list of keys of which their values need to be trimmed before they can be
# inserted into the merge_request_diff_commit_users table.
TRIM_USER_KEYS =
  %i[author_name author_email committer_name committer_email].freeze
# Deprecated; use `bulk_insert!` from `BulkInsertSafe` mixin instead.
# cf. https://gitlab.com/gitlab-org/gitlab/issues/207989 for progress
#
# Builds one row per commit and writes all rows with a single call to
# `ApplicationRecord.legacy_bulk_insert`.
#
# merge_request_diff_id - Value stored in every row's `merge_request_diff_id`.
# commits               - Collection handed to `prepare_commits_for_bulk_insert`;
#                         a commit's position in it becomes `relative_order`.
#
# Returns whatever `ApplicationRecord.legacy_bulk_insert` returns.
def self.create_bulk(merge_request_diff_id, commits)
  commit_hashes, user_tuples = prepare_commits_for_bulk_insert(commits)
  users = MergeRequest::DiffCommitUser.bulk_find_or_create(user_tuples)

  rows = commit_hashes.map.with_index do |commit_hash, index|
    # The commit's `id` is its SHA; it is stored in the `sha` column below.
    sha = commit_hash.delete(:id)

    # `users` is keyed by [name, email] pairs.
    author = users[[commit_hash[:author_name], commit_hash[:author_email]]]
    committer =
      users[[commit_hash[:committer_name], commit_hash[:committer_email]]]

    # These fields are only used to determine the author/committer IDs, we
    # don't store them in the DB.
    commit_hash = commit_hash
      .except(:author_name, :author_email, :committer_name, :committer_email)

    commit_hash.merge(
      commit_author_id: author.id,
      committer_id: committer.id,
      merge_request_diff_id: merge_request_diff_id,
      relative_order: index,
      sha: Gitlab::Database::ShaAttribute.serialize(sha), # rubocop:disable Cop/ActiveRecordSerialize
      authored_date: Gitlab::Database.sanitize_timestamp(commit_hash[:authored_date]),
      committed_date: Gitlab::Database.sanitize_timestamp(commit_hash[:committed_date]),
      # Commits without trailers are stored with an empty JSON object.
      trailers: Gitlab::Json.dump(commit_hash.fetch(:trailers, {}))
    )
  end

  ApplicationRecord.legacy_bulk_insert(self.table_name, rows) # rubocop:disable Gitlab/BulkInsert
end
# Converts commits into attribute hashes ready for bulk insertion and
# collects the distinct users they reference.
#
# For every commit, `to_hash` is called and the `:parent_ids` key dropped.
# Each value listed in TRIM_USER_KEYS is then replaced with the result of
# `MergeRequest::DiffCommitUser.prepare`.
#
# Returns a two-element Array: the prepared hashes (in input order) and a Set
# of `[name, email]` pairs covering every author and committer.
def self.prepare_commits_for_bulk_insert(commits)
  seen_users = Set.new

  prepared = commits.map do |commit|
    attrs = commit.to_hash.except(:parent_ids)

    TRIM_USER_KEYS.each do |field|
      attrs[field] = MergeRequest::DiffCommitUser.prepare(attrs[field])
    end

    # Pairs are recorded after preparation, so they match the stored values.
    seen_users
      .add(attrs.values_at(:author_name, :author_email))
      .add(attrs.values_at(:committer_name, :committer_email))

    attrs
  end

  [prepared, seen_users]
end
# Builds a query returning, for each of the given commit SHAs, the smallest
# ID among merged merge requests targeting `project_id` whose latest diff
# contains that commit.
#
# project_id - Matched against `merge_requests.target_project_id`.
# shas       - Commit SHAs to look up.
#
# Each result exposes `sha` and `merge_request_id`.
def self.oldest_merge_request_id_per_commit(project_id, shas)
  # This method is defined here and not on MergeRequest, otherwise the SHA
  # values used in the WHERE below won't be encoded correctly.
  columns = [
    'merge_request_diff_commits.sha AS sha',
    'min(merge_requests.id) AS merge_request_id'
  ]

  # Only a merge request's latest diff is considered.
  latest_diff_join =
    'INNER JOIN merge_requests ' \
    'ON merge_requests.latest_merge_request_diff_id = merge_request_diffs.id'

  commits_in_latest_diffs =
    select(columns).joins(:merge_request_diff).joins(latest_diff_join)

  matching_commits = commits_in_latest_diffs.where(sha: shas)

  merged_into_project = matching_commits.where(
    merge_requests: {
      target_project_id: project_id,
      state_id: MergeRequest.available_states[:merged]
    }
  )

  merged_into_project.group(:sha)
end
# Returns the `name` of the associated `commit_author`, or nil when there is
# no such record.
def author_name
  commit_author&.name
end
# Returns the `email` of the associated `commit_author`, or nil when there is
# no such record.
def author_email
  commit_author&.email
end
# Returns the `name` of the associated `committer`, or nil when there is no
# such record.
def committer_name
  committer&.name
end
# Returns the `email` of the associated `committer`, or nil when there is no
# such record.
def committer_email
  committer&.email
end
end