# frozen_string_literal: true

# debian-mirror-gitlab/lib/extracts_path.rb (169 lines, 5.9 KiB, Ruby)

# Module providing methods for dealing with separating a tree-ish string and a
# file path string when combined in a request parameter.
#
# The methods below read `@project` and call `params`, `request`, `render_404`
# and `logs_file_project_ref_path` on the including object, so the includer is
# expected to provide them.
module ExtractsPath
  # Raised when given an invalid file path
  InvalidPathError = Class.new(StandardError)

  # Given a string containing both a Git tree-ish, such as a branch or tag, and
  # a filesystem path joined by forward slashes, attempts to separate the two.
  #
  # Expects a @project instance variable to contain the active project. This is
  # used to check the input against a list of valid repository refs.
  #
  # Examples
  #
  #   # No @project available
  #   extract_ref('master')
  #   # => ['', '']
  #
  #   extract_ref('master')
  #   # => ['master', '']
  #
  #   extract_ref("f4b14494ef6abf3d144c28e4af0c20143383e062/CHANGELOG")
  #   # => ['f4b14494ef6abf3d144c28e4af0c20143383e062', 'CHANGELOG']
  #
  #   extract_ref("v2.0.0/README.md")
  #   # => ['v2.0.0', 'README.md']
  #
  #   extract_ref('master/app/models/project.rb')
  #   # => ['master', 'app/models/project.rb']
  #
  #   extract_ref('issues/1234/app/models/project.rb')
  #   # => ['issues/1234', 'app/models/project.rb']
  #
  #   # Given an invalid branch, we fall back to just splitting on the first slash
  #   extract_ref('non/existent/branch/README.md')
  #   # => ['non', 'existent/branch/README.md']
  #
  # Returns an Array where the first value is the tree-ish and the second is the
  # path, with one leading and one trailing slash removed from the path.
  #
  # Raises NoMethodError when no known ref prefixes the id and the id contains
  # no non-slash character (for example an empty string); `assign_ref_vars`
  # rescues this and renders a 404.
  def extract_ref(id)
    return ['', ''] unless @project # rubocop:disable Gitlab/ModuleWithInstanceVariables

    # Anchor with \A (not ^) so that only an id which *starts* with 40 hex
    # digits is treated as a SHA; ^ would also match after an embedded newline
    # and silently drop everything before it.
    sha_match = id.match(/\A(\h{40})(.+)/)

    if sha_match
      # If the ref appears to be a SHA, we're done, just split the string
      ref, path = sha_match.captures
    else
      # Otherwise, attempt to detect the ref using a list of the project's
      # branches and tags.
      # Append a trailing slash if we only get a ref and no file path, so that
      # the "#{name}/" prefix comparison below also matches a bare ref.
      id = "#{id}/" unless id.end_with?('/')

      candidates = ref_names.select { |name| id.start_with?("#{name}/") }

      if candidates.empty?
        # No exact ref match, so just try our best: everything up to the first
        # slash is taken as the ref.
        ref, path = id.match(%r{([^/]+)(.*)}).captures
      else
        # There is a distinct possibility that multiple refs prefix the ID.
        # Use the longest match to maximize the chance that we have the
        # right ref.
        longest = candidates.max_by(&:length)

        # Partition the string into the ref and the path, ignoring the empty
        # first value (the id is known to start with the ref).
        _, ref, path = id.partition(longest)
      end
    end

    # Remove a leading and a trailing slash from the path. \A and \z anchor to
    # the whole string rather than to individual lines.
    [ref, path.gsub(%r{\A/|/\z}, '')]
  end

  # If we have an ID of 'foo.atom', and the controller provides Atom and HTML
  # formats, then we have to check if the request was for the Atom version of
  # the ID without the '.atom' suffix, or the HTML version of the ID including
  # the suffix. We only check this if the version including the suffix doesn't
  # match, so it is possible to create a branch which has an unroutable Atom
  # feed.
  #
  # Returns the longest known ref name that prefixes the id once a trailing
  # '.atom' has been stripped, or nil when no ref matches.
  def extract_ref_without_atom(id)
    # \z keeps this consistent with the `end_with?('.atom')` check performed by
    # assign_ref_vars before calling this method.
    id_without_atom = id.sub(/\.atom\z/, '')
    valid_refs = ref_names.select { |v| "#{id_without_atom}/".start_with?("#{v}/") }

    valid_refs.max_by(&:length)
  end

  # Assigns common instance variables for views working with Git tree-ish objects
  #
  # Assignments are:
  #
  # - @options   - The allowed, non-blank request params (currently "filter_ref")
  # - @id        - A string representing the joined ref and path
  # - @ref       - A string representing the ref (e.g., the branch, tag, or commit SHA)
  # - @path      - A string representing the filesystem path
  # - @repo      - The project's repository
  # - @commit    - A Commit representing the commit from the given ref
  # - @hex_path  - The SHA1 hex digest of @path
  # - @logs_path - The result of logs_file_project_ref_path for the ref and path
  #
  # If the :id parameter appears to be requesting a specific response format,
  # that will be handled as well.
  #
  # If there is no path and the ref doesn't exist in the repo, try to resolve
  # the ref without an '.atom' suffix. If _that_ ref is found, set the request's
  # format to Atom manually.
  #
  # Automatically renders a 404 (via `render_404`) if a valid tree path could
  # not be resolved (e.g., when a user inserts an invalid path or ref). Any
  # RuntimeError or NoMethodError raised while resolving is treated the same way.
  # rubocop:disable Gitlab/ModuleWithInstanceVariables
  def assign_ref_vars
    # assign allowed options
    allowed_options = ["filter_ref"]
    @options = params.select { |key, value| allowed_options.include?(key) && !value.blank? }
    @options = HashWithIndifferentAccess.new(@options)

    @id = get_id
    @ref, @path = extract_ref(@id)
    @repo = @project.repository

    @commit = @repo.commit(@ref)

    if @path.empty? && !@commit && @id.end_with?('.atom')
      @id = @ref = extract_ref_without_atom(@id)
      @commit = @repo.commit(@ref)

      request.format = :atom if @commit
    end

    raise InvalidPathError unless @commit

    @hex_path = Digest::SHA1.hexdigest(@path)
    @logs_path = logs_file_project_ref_path(@project, @ref, @path)
  rescue RuntimeError, NoMethodError, InvalidPathError
    render_404
  end
  # rubocop:enable Gitlab/ModuleWithInstanceVariables

  # Returns the tree at @path for @commit, memoized in @tree.
  # Relies on @repo, @commit and @path having been set (see assign_ref_vars).
  def tree
    @tree ||= @repo.tree(@commit.id, @path) # rubocop:disable Gitlab/ModuleWithInstanceVariables
  end

  # Returns the ids of the blobs at the current path that
  # Gitlab::Git::Blob.batch_lfs_pointers reports as LFS pointers, and stores
  # them in @lfs_blob_ids.
  def lfs_blob_ids
    blob_ids = tree.blobs.map(&:id)

    # When current endpoint is a Blob then `tree.blobs` will be empty, it means we need to analyze
    # the current Blob in order to determine if it's a LFS object
    blob_ids = Array.wrap(@repo.blob_at(@commit.id, @path)&.id) if blob_ids.empty? # rubocop:disable Gitlab/ModuleWithInstanceVariables

    @lfs_blob_ids = Gitlab::Git::Blob.batch_lfs_pointers(@project.repository, blob_ids).map(&:id) # rubocop:disable Gitlab/ModuleWithInstanceVariables
  end

  private

  # Builds the combined "ref/path" id from the request params: params[:id]
  # (falling back to params[:ref]) followed by "/" and params[:path] when a
  # path is present.
  #
  # overridden in subclasses, do not remove
  def get_id
    id = [params[:id] || params[:ref]]
    id << "/" + params[:path] unless params[:path].blank?
    id.join
  end

  # Returns the repository's ref names, memoized in @ref_names, or an empty
  # Array when no @project is set.
  def ref_names
    return [] unless @project # rubocop:disable Gitlab/ModuleWithInstanceVariables

    @ref_names ||= @project.repository.ref_names # rubocop:disable Gitlab/ModuleWithInstanceVariables
  end
end