2019-12-04 20:38:33 +05:30
|
|
|
# frozen_string_literal: true
|
|
|
|
|
2018-11-08 19:23:39 +05:30
|
|
|
require 'fast_spec_helper'
|
2020-03-13 15:44:24 +05:30
|
|
|
require 'support/shared_examples/lib/gitlab/malicious_regexp_shared_examples'
|
2017-08-17 22:00:37 +05:30
|
|
|
|
2023-06-09 08:11:10 +05:30
|
|
|
RSpec.describe Gitlab::UntrustedRegexp, feature_category: :shared do
|
2017-08-17 22:00:37 +05:30
|
|
|
# Construction: a pattern that cannot be compiled must raise.
describe '#initialize' do
  subject(:compiled) { described_class.new(pattern) }

  context 'invalid regexp' do
    # A lone opening bracket is an unterminated character class.
    let(:pattern) { '[' }

    it { expect { compiled }.to raise_error(RegexpError) }
  end
end
|
|
|
|
|
|
|
|
# Every occurrence of the pattern is substituted, not only the first one.
describe '#replace_all' do
  it 'replaces all instances of the match in a string' do
    regexp = described_class.new('foo')

    expect(regexp.replace_all('foo bar foo', 'oof')).to eq('oof bar oof')
  end
end
|
|
|
|
|
2023-06-09 08:11:10 +05:30
|
|
|
# Block-based substitution: the block receives each match and returns the
# replacement text for it.
describe '#replace_gsub' do
  let(:regex_str) { '(?P<scheme>(ftp))' }
  let(:regex) { described_class.new(regex_str, multiline: true) }

  # Runs replace_gsub over +text+, wrapping the named `scheme` capture when
  # the match has one and otherwise returning the match unchanged.
  def rewrite_schemes(regex, text)
    regex.replace_gsub(text) do |match|
      match[:scheme] ? "http|#{match[:scheme]}|rss" : match.to_s
    end
  end

  it 'replaces all instances of the match in a string' do
    rewritten = rewrite_schemes(regex, 'Use only https instead of ftp')

    expect(rewritten).to eq('Use only https instead of http|ftp|rss')
  end

  it 'replaces nothing when no match' do
    text = 'Use only https instead of gopher'

    expect(rewrite_schemes(regex, text)).to eq(text)
  end

  it 'handles empty text' do
    expect(rewrite_schemes(regex, '')).to eq('')
  end
end
|
|
|
|
|
2017-08-17 22:00:37 +05:30
|
|
|
# Only the first occurrence of the pattern is substituted.
describe '#replace' do
  it 'replaces the first instance of the match in a string' do
    regexp = described_class.new('foo')

    expect(regexp.replace('foo bar foo', 'oof')).to eq('oof bar foo')
  end
end
|
|
|
|
|
|
|
|
# Case-equality operator: truthy when the pattern is found in the text.
describe '#===' do
  it 'returns true for a match' do
    regexp = described_class.new('foo')

    expect(regexp === 'a foo here').to be_truthy
  end

  it 'returns false for no match' do
    regexp = described_class.new('foo')

    expect(regexp === 'a bar here').to be_falsy
  end

  it 'can handle regular expressions in multiline mode' do
    # The digit sits at the start of the third line, not of the whole string.
    text = "Header\n\n1. Content"
    multiline_regexp = described_class.new('^\d', multiline: true)

    expect(multiline_regexp === text).to be_truthy
  end
end
|
|
|
|
|
2019-04-03 18:18:56 +05:30
|
|
|
# Boolean predicate: whether the pattern is found anywhere in the text.
describe '#match?' do
  subject { described_class.new(regexp).match?(text) }

  context 'malicious regexp' do
    # malicious_text and malicious_regexp_re2 are not defined in this file;
    # presumably they come from the 'malicious regexp' shared examples.
    let(:text) { malicious_text }
    let(:regexp) { malicious_regexp_re2 }

    include_examples 'malicious regexp'
  end

  context 'matching regexp' do
    let(:regexp) { 'foo' }
    let(:text) { 'foo' }

    # The example title names the boolean that is actually asserted.
    it 'returns true' do
      is_expected.to be(true)
    end
  end

  context 'non-matching regexp' do
    let(:regexp) { 'boo' }
    let(:text) { 'foo' }

    it 'returns false' do
      is_expected.to be(false)
    end
  end
end
|
|
|
|
|
2017-08-17 22:00:37 +05:30
|
|
|
# Scanning: the shape of each returned element depends on how many capture
# groups the pattern declares.
describe '#scan' do
  subject(:matches) { described_class.new(regexp).scan(text) }

  context 'malicious regexp' do
    # malicious_text and malicious_regexp_re2 are not defined in this file;
    # presumably they come from the 'malicious regexp' shared examples.
    let(:regexp) { malicious_regexp_re2 }
    let(:text) { malicious_text }

    include_examples 'malicious regexp'
  end

  context 'empty regexp' do
    let(:text) { 'foo' }
    let(:regexp) { '' }

    it 'returns an array of nil matches' do
      # Four entries are expected for the three-character text.
      expect(matches).to eq([nil, nil, nil, nil])
    end
  end

  context 'empty capture group regexp' do
    let(:text) { 'foo' }
    let(:regexp) { '()' }

    it 'returns an array of nil matches in an array' do
      expect(matches).to eq([[nil], [nil], [nil], [nil]])
    end
  end

  context 'no capture group' do
    let(:text) { 'foo' }
    let(:regexp) { '.+' }

    it 'returns the whole match' do
      expect(matches).to eq(['foo'])
    end
  end

  context 'one capture group' do
    let(:text) { 'foo' }
    let(:regexp) { '(f).+' }

    it 'returns the captured part' do
      expect(matches).to eq([%w[f]])
    end
  end

  context 'two capture groups' do
    let(:text) { 'foo' }
    let(:regexp) { '(f).(o)' }

    it 'returns the captured parts' do
      expect(matches).to eq([%w[f o]])
    end
  end
end
|
2021-04-29 21:17:54 +05:30
|
|
|
|
2023-06-09 08:11:10 +05:30
|
|
|
# Looks up named capture groups in a single element of a scan result.
describe '#extract_named_group' do
  # Two alternatives: "name age", or a bare word captured as name_only.
  let(:re) { described_class.new('(?P<name>\w+) (?P<age>\d+)|(?P<name_only>\w+)') }
  let(:text) { 'Bob 40' }

  it 'returns values for both named groups' do
    matched = re.scan(text).first

    expect(re.extract_named_group(:name, matched)).to eq 'Bob'
    expect(re.extract_named_group(:age, matched)).to eq '40'
  end

  it 'returns nil if there was no match for group' do
    # 'Bob' alone is expected to be captured only by the name_only alternative.
    matched = re.scan('Bob').first

    expect(re.extract_named_group(:name, matched)).to be_nil
    expect(re.extract_named_group(:age, matched)).to be_nil
    expect(re.extract_named_group(:name_only, matched)).to eq 'Bob'
  end

  it 'returns nil if match is nil' do
    # A nil match is passed explicitly so the example does not depend on how
    # an unrelated scan happens to come back empty.
    matched = nil

    expect(re.extract_named_group(:age, matched)).to be_nil
  end

  it 'raises if name is not a capture group' do
    matched = re.scan(text).first

    expect { re.extract_named_group(:foo, matched) }.to raise_error('Invalid named capture group: foo')
  end
end
|
|
|
|
|
2021-04-29 21:17:54 +05:30
|
|
|
# Single match lookup: a match object on success, nil otherwise.
describe '#match' do
  context 'when there are matches' do
    it 'returns a match object' do
      regexp = described_class.new('(?P<number>\d+)')
      found = regexp.match('hello 10')

      # The named group is read from the match object by symbol key.
      expect(found[:number]).to eq('10')
    end
  end

  context 'when there are no matches' do
    it 'returns nil' do
      regexp = described_class.new('(?P<number>\d+)')

      expect(regexp.match('hello')).to be_nil
    end
  end
end
|
2017-08-17 22:00:37 +05:30
|
|
|
end
|