83 lines
2.3 KiB
Ruby
83 lines
2.3 KiB
Ruby
# frozen_string_literal: true
|
|
|
|
module Gitlab
|
|
module Search
|
|
class Query < SimpleDelegator
|
|
include EncodingHelper
|
|
|
|
# Matches a double quote at the very start of a string, or one at its end
# (`\Z` also accepts a single trailing newline after that quote).
# extract_filters uses it to strip the quotes surrounding a filter value.
QUOTES_REGEXP = %r{\A"|"\Z}.freeze
|
|
TOKEN_WITH_QUOTES_REGEXP = %r{\s(?=(?:[^"]|"[^"]*")*$)}.freeze
|
|
|
|
# Builds a search query from a raw string and an optional filter DSL block.
#
# query       - the raw search input; a copy of it is kept in @raw_query.
# filter_opts - Hash merged over the defaults (default_parser: downcase).
# block       - optional; evaluated in the context of this instance, so it
#               can call the private `filter` and `filter_options` helpers.
def initialize(query, filter_opts = {}, &block)
  @raw_query = query.dup
  @filters = []

  defaults = { default_parser: :downcase.to_proc }
  @filter_options = defaults.merge(filter_opts)

  # Filters have to be registered before anything is extracted below.
  instance_eval(&block) if block

  remaining_query, parsed_filters = extract_filters
  @query = Gitlab::Search::ParsedQuery.new(remaining_query, parsed_filters)

  # SimpleDelegator forwards to whatever object is handed to super, so the
  # ParsedQuery becomes the delegate of this instance.
  super(@query)
end
|
|
|
|
private
|
|
|
|
# Registers a filter definition by appending it to @filters.
#
# name       - the filter keyword, stored under :name.
# attributes - extra keys merged over the defaults; a :parser given here
#              replaces the default parser from @filter_options.
#
# Returns @filters.
def filter(name, **attributes)
  defaults = { parser: @filter_options[:default_parser], name: name }

  @filters.push(defaults.merge(attributes))
end
|
|
|
|
# Merges the given options into @filter_options in place.
#
# Returns the updated @filter_options Hash.
def filter_options(**options)
  @filter_options.update(options)
end
|
|
|
|
# Splits the raw query into free-text search terms and parsed filters.
#
# Every token of the form `name:value` (or `-name:value` for a negated
# filter) whose name was registered in @filters is removed from the query
# and turned into a copy of the filter hash with three extra keys:
#   :negated     - true when the token starts with "-"
#   :value       - the parsed value, with surrounding double quotes removed
#   :regex_value - the escaped value where each `*` became a lazy `.*?`
# Tokens whose value is empty (e.g. `path:`) are left in the query as-is.
#
# Returns a two-element Array: [query String, Array of filter Hashes].
# The query is '*' when no free-text token remains.
def extract_filters
  consumed_tokens = []
  query_tokens = parse_raw_query

  filters = @filters.each_with_object([]) do |filter, parsed_filters|
    # Built once per filter rather than once per token.
    filter_prefix = /\A-?#{filter[:name]}:/

    query_tokens.each do |token|
      next unless token.match?(filter_prefix)

      # The value is everything after the FIRST colon. Splitting on every
      # colon and re-joining would silently drop colons that are part of
      # the value (e.g. path:"foo:bar").
      input = token.partition(':').last
      next if input.empty?

      # Work on a copy so the registered filter definition stays pristine.
      query_filter = filter.dup
      query_filter[:negated] = token.start_with?('-')
      query_filter[:value] = parse_filter(query_filter, input.gsub(QUOTES_REGEXP, ''))
      query_filter[:regex_value] = Regexp.escape(query_filter[:value]).gsub('\*', '.*?')

      consumed_tokens << token
      parsed_filters << query_filter
    end
  end

  query = (query_tokens - consumed_tokens).join(' ')
  query = '*' if query.empty?

  [query, filters]
end
|
|
|
|
# Runs the filter's :parser over the raw input.
#
# When the :encode_binary filter option is truthy, the parsed value is
# additionally passed through encode_binary before being returned.
def parse_filter(filter, input)
  parsed = filter[:parser].call(input)
  return parsed unless @filter_options[:encode_binary]

  encode_binary(parsed)
end
|
|
|
|
# Tokenizes @raw_query on whitespace that lies outside double-quoted
# phrases and drops empty tokens. Quotes are kept on the tokens, so
# '"search term" path:"foo bar.txt"' becomes
# ["\"search term\"", "path:\"foo bar.txt\""].
def parse_raw_query
  tokens = @raw_query.split(TOKEN_WITH_QUOTES_REGEXP)

  tokens.reject { |token| token.empty? }
end
|
|
end
|
|
end
|
|
end
|