debian-mirror-gitlab/spec/lib/gitlab/untrusted_regexp_spec.rb

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

223 lines
5.4 KiB
Ruby
Raw Normal View History

2019-12-04 20:38:33 +05:30
# frozen_string_literal: true
2018-11-08 19:23:39 +05:30
require 'fast_spec_helper'
2020-03-13 15:44:24 +05:30
require 'support/shared_examples/lib/gitlab/malicious_regexp_shared_examples'
2017-08-17 22:00:37 +05:30
2023-06-09 08:11:10 +05:30
RSpec.describe Gitlab::UntrustedRegexp, feature_category: :shared do
2017-08-17 22:00:37 +05:30
describe '#initialize' do
  # Construction is the behaviour under test, so the subject is only ever
  # evaluated inside an `expect { }` block.
  subject(:build_regexp) { described_class.new(pattern) }

  context 'invalid regexp' do
    # A lone opening bracket; the constructor is expected to reject it.
    let(:pattern) { '[' }

    specify { expect { build_regexp }.to raise_error(RegexpError) }
  end
end
describe '#replace_all' do
  it 'replaces all instances of the match in a string' do
    regexp = described_class.new('foo')

    # Both occurrences of "foo" in the input are expected to be rewritten.
    expect(regexp.replace_all('foo bar foo', 'oof')).to eq('oof bar oof')
  end
end
2023-06-09 08:11:10 +05:30
describe '#replace_gsub' do
  let(:regex_str) { '(?P<scheme>(ftp))' }
  let(:regex) { described_class.new(regex_str, multiline: true) }

  # Runs `replace_gsub` over +text+. A match exposing the named `scheme`
  # capture is replaced with "http|<scheme>|rss"; any other match is echoed
  # back as its own string form.
  def rewrite_schemes(regex, text)
    regex.replace_gsub(text) do |match|
      next match.to_s unless match[:scheme]

      "http|#{match[:scheme]}|rss"
    end
  end

  it 'replaces all instances of the match in a string' do
    rewritten = rewrite_schemes(regex, 'Use only https instead of ftp')

    expect(rewritten).to eq('Use only https instead of http|ftp|rss')
  end

  it 'replaces nothing when no match' do
    untouched = 'Use only https instead of gopher'

    expect(rewrite_schemes(regex, untouched)).to eq(untouched)
  end

  it 'handles empty text' do
    expect(rewrite_schemes(regex, '')).to eq('')
  end
end
2017-08-17 22:00:37 +05:30
describe '#replace' do
  it 'replaces the first instance of the match in a string' do
    regexp = described_class.new('foo')

    # Only the leading "foo" changes; the trailing one must survive.
    expect(regexp.replace('foo bar foo', 'oof')).to eq('oof bar foo')
  end
end
# Specs for the case-equality operator applied to plain strings.
# NOTE(review): the bare timestamp lines inside this block are residue from the
# blame view this file was captured from; they are not Ruby.
describe '#===' do
it 'returns true for a match' do
result = described_class.new('foo') === 'a foo here'
# Only truthiness is asserted here, not a strict `true`.
expect(result).to be_truthy
end
it 'returns false for no match' do
result = described_class.new('foo') === 'a bar here'
# Only falsiness is asserted here, not a strict `false`.
expect(result).to be_falsy
end
2018-11-08 19:23:39 +05:30
it 'can handle regular expressions in multiline mode' do
# With `multiline: true`, `^\d` is expected to match the digit that opens the
# third line of the text rather than only the start of the whole string.
regexp = described_class.new('^\d', multiline: true)
result = regexp === "Header\n\n1. Content"
expect(result).to be_truthy
end
2017-08-17 22:00:37 +05:30
end
2019-04-03 18:18:56 +05:30
# Specs for the boolean predicate: the examples assert a strict `true` or
# `false`, so their descriptions say so.
describe '#match?' do
  subject { described_class.new(regexp).match?(text) }

  context 'malicious regexp' do
    # `malicious_text` and `malicious_regexp_re2` are not defined in this file;
    # presumably they come from the required shared-examples support file.
    let(:text) { malicious_text }
    let(:regexp) { malicious_regexp_re2 }

    include_examples 'malicious regexp'
  end

  context 'matching regexp' do
    let(:regexp) { 'foo' }
    let(:text) { 'foo' }

    it 'returns true' do
      is_expected.to eq(true)
    end
  end

  context 'non-matching regexp' do
    let(:regexp) { 'boo' }
    let(:text) { 'foo' }

    it 'returns false' do
      is_expected.to eq(false)
    end
  end
end
2017-08-17 22:00:37 +05:30
# Specs for #scan. The expectations below pin the shape of the result: plain
# whole-match entries when the pattern has no capture group, and one array of
# captures per match when it has groups.
# NOTE(review): the bare timestamp lines inside this block are residue from the
# blame view this file was captured from; they are not Ruby.
describe '#scan' do
subject { described_class.new(regexp).scan(text) }
2019-04-03 18:18:56 +05:30
2017-08-17 22:00:37 +05:30
context 'malicious regexp' do
# `malicious_text` and `malicious_regexp_re2` are not defined in this file;
# presumably they come from the required shared-examples support file.
let(:text) { malicious_text }
2019-04-03 18:18:56 +05:30
let(:regexp) { malicious_regexp_re2 }
2017-08-17 22:00:37 +05:30
include_examples 'malicious regexp'
end
context 'empty regexp' do
let(:regexp) { '' }
let(:text) { 'foo' }
2017-09-10 17:25:29 +05:30
# Four entries for a three-character text; presumably one empty match per
# position, including the end of the string.
it 'returns an array of nil matches' do
is_expected.to eq([nil, nil, nil, nil])
2017-08-17 22:00:37 +05:30
end
end
context 'empty capture group regexp' do
let(:regexp) { '()' }
let(:text) { 'foo' }
2017-09-10 17:25:29 +05:30
# Same four matches as the empty pattern, but each is wrapped in an array
# because the pattern contains one capture group.
it 'returns an array of nil matches in an array' do
is_expected.to eq([[nil], [nil], [nil], [nil]])
2017-08-17 22:00:37 +05:30
end
end
context 'no capture group' do
let(:regexp) { '.+' }
let(:text) { 'foo' }
# Without capture groups each result entry is the matched text itself.
it 'returns the whole match' do
is_expected.to eq(['foo'])
end
end
context 'one capture group' do
let(:regexp) { '(f).+' }
let(:text) { 'foo' }
# With a capture group the entry holds only the captures, not the full match.
it 'returns the captured part' do
is_expected.to eq([%w[f]])
end
end
context 'two capture groups' do
let(:regexp) { '(f).(o)' }
let(:text) { 'foo' }
# Captures appear in group order within the per-match array.
it 'returns the captured parts' do
is_expected.to eq([%w[f o]])
end
end
end
2021-04-29 21:17:54 +05:30
2023-06-09 08:11:10 +05:30
# Specs for looking up a named capture in one entry of a #scan result.
describe '#extract_named_group' do
  # Two alternatives: "<name> <age>", or a lone word captured as `name_only`.
  let(:re) { described_class.new('(?P<name>\w+) (?P<age>\d+)|(?P<name_only>\w+)') }
  let(:text) { 'Bob 40' }

  it 'returns values for both named groups' do
    matched = re.scan(text).first

    expect(re.extract_named_group(:name, matched)).to eq 'Bob'
    expect(re.extract_named_group(:age, matched)).to eq '40'
  end

  it 'returns nil if there was no match for group' do
    # 'Bob' alone can only satisfy the `name_only` alternative.
    matched = re.scan('Bob').first

    expect(re.extract_named_group(:name, matched)).to be_nil
    expect(re.extract_named_group(:age, matched)).to be_nil
    expect(re.extract_named_group(:name_only, matched)).to eq 'Bob'
  end

  it 'returns nil if match is nil' do
    # Pass nil explicitly. The previous setup called String#scan on the pattern
    # source with `text` as a literal substring pattern, which yielded nil only
    # because 'Bob 40' does not occur in that string.
    expect(re.extract_named_group(:age, nil)).to be_nil
  end

  it 'raises if name is not a capture group' do
    matched = re.scan(text).first

    expect { re.extract_named_group(:foo, matched) }.to raise_error('Invalid named capture group: foo')
  end
end
2021-04-29 21:17:54 +05:30
describe '#match' do
  # One pattern with a named `number` capture serves both contexts.
  let(:regexp) { described_class.new('(?P<number>\d+)') }

  context 'when there are matches' do
    it 'returns a match object' do
      # The returned object is indexed by the capture name.
      expect(regexp.match('hello 10')[:number]).to eq('10')
    end
  end

  context 'when there are no matches' do
    it 'returns nil' do
      expect(regexp.match('hello')).to be_nil
    end
  end
end
2017-08-17 22:00:37 +05:30
end