debian-mirror-gitlab/spec/models/concerns/pg_full_text_searchable_spec.rb

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

239 lines
8.9 KiB
Ruby
Raw Permalink Normal View History

2022-05-07 20:08:51 +05:30
# frozen_string_literal: true
require 'spec_helper'
2023-04-23 21:23:45 +05:30
RSpec.describe PgFullTextSearchable, feature_category: :global_search do
2023-03-04 22:38:38 +05:30
# Project built from the :project factory, paired with a built :project_namespace.
let(:project) do
  namespace = build(:project_namespace)
  build(:project, project_namespace: namespace)
end
2022-05-07 20:08:51 +05:30
# Anonymous ActiveRecord model backed by the `issues` table that mixes in
# PgFullTextSearchable. The examples exercise the concern through this class.
let(:model_class) do
Class.new(ActiveRecord::Base) do
include PgFullTextSearchable
self.table_name = 'issues'
belongs_to :project
2023-03-04 22:38:38 +05:30
belongs_to :namespace
2022-05-07 20:08:51 +05:30
has_one :search_data, class_name: 'Issues::SearchData'
2022-08-13 15:12:31 +05:30
# Assign the default issue work item type id before validation runs.
before_validation -> { self.work_item_type_id = ::WorkItems::Type.default_issue_type.id }
2022-05-07 20:08:51 +05:30
# Upserts the given search vector into Issues::SearchData for this record,
# using (project_id, issue_id) as the uniqueness key.
def persist_pg_full_text_search_vector(search_vector)
Issues::SearchData.upsert({ project_id: project_id, issue_id: id, search_vector: search_vector }, unique_by: %i(project_id issue_id))
end
# A class created with Class.new has no name of its own; report 'Issue'.
# NOTE(review): presumably required by code that reads the class name - confirm.
def self.name
'Issue'
end
end
end
describe '.pg_full_text_searchable' do
  # Builds a fresh column list on every call: `title` weighted 'A'.
  def title_only_columns
    [{ name: 'title', weight: 'A' }]
  end

  it 'sets pg_full_text_searchable_columns' do
    model_class.pg_full_text_searchable(columns: title_only_columns)

    registered = model_class.pg_full_text_searchable_columns
    expect(registered).to eq({ 'title' => 'A' })
  end

  it 'raises an error when called twice' do
    model_class.pg_full_text_searchable(columns: title_only_columns)

    # A second registration on the same class must be rejected.
    expect do
      model_class.pg_full_text_searchable(columns: title_only_columns)
    end.to raise_error('Full text search columns already defined!')
  end
end
describe 'after commit hook' do
2023-03-04 22:38:38 +05:30
# Persisted record with no title or description set explicitly.
let(:model) do
  model_class.create!(
    project: project,
    namespace: project.project_namespace
  )
end
2022-05-07 20:08:51 +05:30
# Only `title` is registered as a searchable column for these examples.
before do
  searchable_columns = [{ name: 'title', weight: 'A' }]
  model_class.pg_full_text_searchable(columns: searchable_columns)
end
context 'when specified columns are changed' do
  it 'calls update_search_data!' do
    record = model
    expect(record).to receive(:update_search_data!)

    # `title` is a registered searchable column, so the hook should fire.
    record.update!(title: 'A new title')
  end
end
# Counterpart to the previous context: only `description` changes, which is not
# among the columns registered in this group's `before` block.
context 'when specified columns are not changed' do
2022-07-16 23:28:13 +05:30
it 'does not call update_search_data!' do
2022-05-07 20:08:51 +05:30
expect(model).not_to receive(:update_search_data!)
model.update!(description: 'A new description')
end
end
2022-07-16 23:28:13 +05:30
context 'when model is updated twice within a transaction' do
  it 'calls update_search_data!' do
    record = model
    expect(record).to receive(:update_search_data!)

    # The searchable column changes in the first update only; the second
    # update touches just `updated_at` inside the same transaction.
    record.transaction do
      record.update!(title: 'A new title')
      record.update!(updated_at: Time.current)
    end
  end
end
2022-05-07 20:08:51 +05:30
end
describe '.pg_full_text_search' do
2023-03-04 22:38:38 +05:30
# Plain English title and description.
let(:english) do
  model_class.create!(
    project: project,
    namespace: project.project_namespace,
    title: 'title',
    description: 'something description english'
  )
end

# Title and description made of accented Latin characters.
let(:with_accent) do
  model_class.create!(
    project: project,
    namespace: project.project_namespace,
    title: 'Jürgen',
    description: 'Ærøskøbing'
  )
end

# Title mixing Japanese characters with an English word.
let(:japanese) do
  model_class.create!(
    project: project,
    namespace: project.project_namespace,
    title: '日本語 title',
    description: 'another english description'
  )
end
2022-05-07 20:08:51 +05:30
# Register `title` (weight A) and `description` (weight B), then create the
# three fixture records and write search data for each of them.
before do
  model_class.pg_full_text_searchable(
    columns: [
      { name: 'title', weight: 'A' },
      { name: 'description', weight: 'B' }
    ]
  )

  [english, with_accent, japanese].each { |record| record.update_search_data! }
end
it 'searches across all fields' do
  results = model_class.pg_full_text_search('title english')

  # Both records carry "title" in the title and "english" in the description.
  expect(results).to contain_exactly(english, japanese)
end
2023-01-13 00:05:48 +05:30
# With matched_columns limited to `title`, only the record whose title is
# 'english' is expected; the fixtures that mention "english" in their
# description alone must not be returned.
it 'searches specified columns only' do
2023-03-04 22:38:38 +05:30
matching_object = model_class.create!(project: project, namespace: project.project_namespace, title: 'english', description: 'some description')
2023-01-13 00:05:48 +05:30
matching_object.update_search_data!
expect(model_class.pg_full_text_search('english', matched_columns: %w(title))).to contain_exactly(matching_object)
end
it 'uses prefix matching' do
  # "tit" and "eng" are prefixes of "title" and "english".
  results = model_class.pg_full_text_search('tit eng')

  expect(results).to contain_exactly(english, japanese)
end
2022-05-07 20:08:51 +05:30
# The double-quoted term is expected to match only `english`, whose description
# contains "description english" in that order; `japanese` has the same two
# words in the opposite order and must not be returned.
it 'searches for exact term with quotes' do
2023-01-13 00:05:48 +05:30
expect(model_class.pg_full_text_search('"description english"')).to contain_exactly(english)
2022-05-07 20:08:51 +05:30
end
# The record titled 'Jürgen' must be found by both the unaccented and the
# accented spelling of the search term.
it 'ignores accents' do
expect(model_class.pg_full_text_search('jurgen')).to contain_exactly(with_accent)
2022-10-11 01:57:18 +05:30
expect(model_class.pg_full_text_search('Jürgen')).to contain_exactly(with_accent)
2022-05-07 20:08:51 +05:30
end
it 'does not support searching by non-Latin characters' do
  # `japanese` has these characters in its title, yet nothing may match.
  results = model_class.pg_full_text_search('日本')

  expect(results).to be_empty
end
2022-07-23 23:45:48 +05:30
# The fixture's description embeds an https URL directly after a comma.
# Searching for that URL must find the record, and so must the same URL with
# a different scheme (gopher://).
context 'when search term has a URL' do
2023-03-04 22:38:38 +05:30
let(:with_url) { model_class.create!(project: project, namespace: project.project_namespace, title: 'issue with url', description: 'sample url,https://gitlab.com/gitlab-org/gitlab') }
2022-07-23 23:45:48 +05:30
it 'allows searching by full URL, ignoring the scheme' do
with_url.update_search_data!
expect(model_class.pg_full_text_search('https://gitlab.com/gitlab-org/gitlab')).to contain_exactly(with_url)
expect(model_class.pg_full_text_search('gopher://gitlab.com/gitlab-org/gitlab')).to contain_exactly(with_url)
end
end
2023-01-13 00:05:48 +05:30
# A file path containing slashes, underscores, a digit and a dot is embedded
# in the description; searching for the whole path must find the record.
context 'when search term is a path with underscores' do
let(:path) { 'browser_ui/5_package/package_registry/maven/maven_group_level_spec.rb' }
2023-03-04 22:38:38 +05:30
let(:with_underscore) { model_class.create!(project: project, namespace: project.project_namespace, title: 'issue with path', description: "some #{path} other text") }
2023-01-13 00:05:48 +05:30
it 'allows searching by the path' do
with_underscore.update_search_data!
expect(model_class.pg_full_text_search(path)).to contain_exactly(with_underscore)
end
end
# The description is 'ABC-123'; searching for just '123' must still find it.
context 'when text has numbers preceded by a dash' do
2023-03-04 22:38:38 +05:30
let(:with_dash) { model_class.create!(project: project, namespace: project.project_namespace, title: 'issue with dash', description: 'ABC-123') }
2023-01-13 00:05:48 +05:30
it 'allows searching by numbers only' do
with_dash.update_search_data!
expect(model_class.pg_full_text_search('123')).to contain_exactly(with_dash)
end
end
2022-05-07 20:08:51 +05:30
end
describe '#update_search_data!' do
2023-03-04 22:38:38 +05:30
# Default record for this group: a simple title and description.
let(:model) do
  model_class.create!(
    project: project,
    namespace: project.project_namespace,
    title: 'title',
    description: 'description'
  )
end
2022-05-07 20:08:51 +05:30
# Register `title` with weight A and `description` with weight B.
before do
  model_class.pg_full_text_searchable(
    columns: [
      { name: 'title', weight: 'A' },
      { name: 'description', weight: 'B' }
    ]
  )
end
it 'sets the correct weights' do
  model.update_search_data!

  # The stored vector holds the stemmed lexemes tagged with position and weight.
  vector = model.search_data.search_vector
  expect(vector).to match(/'titl':1A/)
  expect(vector).to match(/'descript':2B/)
end
# Overrides `model` with a Japanese title and an accented description. The
# stored vector must not contain the Japanese text and must contain the
# unaccented form 'jurgen'.
context 'with accented and non-Latin characters' do
2023-03-04 22:38:38 +05:30
let(:model) { model_class.create!(project: project, namespace: project.project_namespace, title: '日本語', description: 'Jürgen') }
2022-05-07 20:08:51 +05:30
it 'transliterates accented characters and removes non-Latin ones' do
model.update_search_data!
expect(model.search_data.search_vector).not_to match(/日本語/)
expect(model.search_data.search_vector).to match(/jurgen/)
end
end
# Overrides `model` so that each field holds one short word followed by a
# single unbroken run: 'long/sequence+1' * 4 is 60 characters and
# '@user1' * 20 is 120 characters, both past the 50-character threshold named
# in the example. The short words must survive; the long runs must not.
context 'with long words' do
2023-03-04 22:38:38 +05:30
let(:model) { model_class.create!(project: project, namespace: project.project_namespace, title: 'title ' + 'long/sequence+1' * 4, description: 'description ' + '@user1' * 20) }
2022-05-07 20:08:51 +05:30
it 'strips words that are 50 characters or longer' do
model.update_search_data!
expect(model.search_data.search_vector).to match(/'titl':1A/)
expect(model.search_data.search_vector).not_to match(/long/)
expect(model.search_data.search_vector).not_to match(/sequence/)
expect(model.search_data.search_vector).to match(/'descript':2B/)
expect(model.search_data.search_vector).not_to match(/@user1/)
end
end
context 'when upsert times out' do
  it 're-raises the exception' do
    timeout_error = ActiveRecord::StatementTimeout

    # Force the single expected upsert call to fail with a statement timeout.
    expect(Issues::SearchData).to receive(:upsert).once.and_raise(timeout_error)

    expect do
      model.update_search_data!
    end.to raise_error(timeout_error)
  end
end
# The description is 30,000 random hex tokens joined by spaces, intended
# (per the context name) to exceed the tsvector size limit. The failure must
# be reported through Gitlab::AppJsonLogger.error with the class name and
# record id, must not raise, and must leave no search data behind.
# NOTE(review): the :delete metadata presumably selects a deletion-based DB
# cleanup strategy for this example - confirm against the spec helpers.
context 'with strings that go over tsvector limit', :delete do
let(:long_string) { Array.new(30_000) { SecureRandom.hex }.join(' ') }
2023-03-04 22:38:38 +05:30
let(:model) { model_class.create!(project: project, namespace: project.project_namespace, title: 'title', description: long_string) }
2022-05-07 20:08:51 +05:30
it 'does not raise an exception' do
expect(Gitlab::AppJsonLogger).to receive(:error).with(
a_hash_including(class: model_class.name, model_id: model.id)
)
expect { model.update_search_data! }.not_to raise_error
expect(model.search_data).to eq(nil)
end
end
# Redefines `model_class` with the same setup as the top-level one but without
# a persist_pg_full_text_search_vector method, and expects
# update_search_data! to raise NotImplementedError.
context 'when model class does not implement persist_pg_full_text_search_vector' do
let(:model_class) do
Class.new(ActiveRecord::Base) do
include PgFullTextSearchable
self.table_name = 'issues'
belongs_to :project
2023-03-04 22:38:38 +05:30
belongs_to :namespace
2022-05-07 20:08:51 +05:30
has_one :search_data, class_name: 'Issues::SearchData'
2022-08-13 15:12:31 +05:30
# Assign the default issue work item type id before validation runs.
before_validation -> { self.work_item_type_id = ::WorkItems::Type.default_issue_type.id }
2022-05-07 20:08:51 +05:30
# A class created with Class.new has no name of its own; report 'Issue'.
def self.name
'Issue'
end
end
end
it 'raises an error' do
expect { model.update_search_data! }.to raise_error(NotImplementedError)
end
end
end
end