2021-03-11 19:13:27 +05:30
# frozen_string_literal: true
module Gitlab
module Database
module MigrationHelpers
module V2
include Gitlab :: Database :: MigrationHelpers
2021-11-11 11:23:49 +05:30
# Creates a new table, optionally allowing the caller to add text limit constraints to the table.
# This method only extends Rails' `create_table` method
#
# Example:
#
# create_table :db_guides do |t|
# t.bigint :stars, default: 0, null: false
# t.text :title, limit: 128
# t.text :notes, limit: 1024
#
# t.check_constraint 'stars > 1000', name: 'so_many_stars'
# end
#
# See Rails' `create_table` for more info on the available arguments.
#
# When adding foreign keys to other tables, consider wrapping the call into a with_lock_retries block
# to avoid traffic stalls.
def create_table ( table_name , * args , ** kwargs , & block )
helper_context = self
super do | t |
t . define_singleton_method ( :text ) do | column_name , ** kwargs |
limit = kwargs . delete ( :limit )
super ( column_name , ** kwargs )
if limit
# rubocop:disable GitlabSecurity/PublicSend
name = helper_context . send ( :text_limit_name , table_name , column_name )
# rubocop:enable GitlabSecurity/PublicSend
column_name = helper_context . quote_column_name ( column_name )
definition = " char_length( #{ column_name } ) <= #{ limit } "
t . check_constraint ( definition , name : name )
end
end
t . instance_eval ( & block ) unless block . nil?
end
end
# Executes the block with a retry mechanism that alters the +lock_timeout+ and +sleep_time+ between attempts.
# The timings can be controlled via the +timing_configuration+ parameter.
# If the lock was not acquired within the retry period, a last attempt is made without using +lock_timeout+.
#
# In order to retry the block, the method wraps the block into a transaction.
#
# When called inside an open transaction it will execute the block directly if lock retries are enabled
# with `enable_lock_retries!` at migration level, otherwise it will raise an error.
#
# ==== Examples
# # Invoking without parameters
# with_lock_retries do
# drop_table :my_table
# end
#
# # Invoking with custom +timing_configuration+
# t = [
# [1.second, 1.second],
# [2.seconds, 2.seconds]
# ]
#
# with_lock_retries(timing_configuration: t) do
# drop_table :my_table # this will be retried twice
# end
#
# # Disabling the retries using an environment variable
# > export DISABLE_LOCK_RETRIES=true
#
# with_lock_retries do
# drop_table :my_table # one invocation, it will not retry at all
# end
#
# ==== Parameters
# * +timing_configuration+ - [[ActiveSupport::Duration, ActiveSupport::Duration], ...] lock timeout for the block, sleep time before the next iteration, defaults to `Gitlab::Database::WithLockRetries::DEFAULT_TIMING_CONFIGURATION`
# * +logger+ - [Gitlab::JsonLogger]
# * +env+ - [Hash] custom environment hash, see the example with `DISABLE_LOCK_RETRIES`
def with_lock_retries ( * args , ** kwargs , & block )
if transaction_open?
if enable_lock_retries?
Gitlab :: AppLogger . warn 'Lock retries already enabled, executing the block directly'
yield
else
raise << ~ EOF
#{__callee__} can not be run inside an already open transaction
Use migration - level lock retries instead , see https : / / docs . gitlab . com / ee / development / migration_style_guide . html #retry-mechanism-when-acquiring-database-locks
EOF
end
else
super ( * args , ** kwargs . merge ( allow_savepoints : false ) , & block )
end
end
2021-03-11 19:13:27 +05:30
# Renames a column without requiring downtime.
#
# Concurrent renames work by using database triggers to ensure both the
# old and new column are in sync. However, this method will _not_ remove
# the triggers or the old column automatically; this needs to be done
# manually in a post-deployment migration. This can be done using the
# method `cleanup_concurrent_column_rename`.
#
# table - The name of the database table containing the column.
# old_column - The old column name.
# new_column - The new column name.
# type - The type of the new column. If no type is given the old column's
# type is used.
# batch_column_name - option is for tables without primary key, in this
# case another unique integer column can be used. Example: :user_id
def rename_column_concurrently ( table , old_column , new_column , type : nil , batch_column_name : :id )
2022-06-21 17:19:12 +05:30
Gitlab :: Database :: QueryAnalyzers :: RestrictAllowedSchemas . require_ddl_mode!
2021-03-11 19:13:27 +05:30
setup_renamed_column ( __callee__ , table , old_column , new_column , type , batch_column_name )
with_lock_retries do
install_bidirectional_triggers ( table , old_column , new_column )
end
end
# Reverses operations performed by rename_column_concurrently.
#
# This method takes care of removing previously installed triggers as well
# as removing the new column.
#
# table - The name of the database table.
# old_column - The name of the old column.
# new_column - The name of the new column.
def undo_rename_column_concurrently ( table , old_column , new_column )
teardown_rename_mechanism ( table , old_column , new_column , column_to_remove : new_column )
end
# Cleans up a concurrent column name.
#
# This method takes care of removing previously installed triggers as well
# as removing the old column.
#
# table - The name of the database table.
# old_column - The name of the old column.
# new_column - The name of the new column.
def cleanup_concurrent_column_rename ( table , old_column , new_column )
teardown_rename_mechanism ( table , old_column , new_column , column_to_remove : old_column )
end
# Reverses the operations performed by cleanup_concurrent_column_rename.
#
# This method adds back the old_column removed
# by cleanup_concurrent_column_rename.
# It also adds back the triggers that are removed
# by cleanup_concurrent_column_rename.
#
# table - The name of the database table containing the column.
# old_column - The old column name.
# new_column - The new column name.
# type - The type of the old column. If no type is given the new column's
# type is used.
# batch_column_name - option is for tables without primary key, in this
# case another unique integer column can be used. Example: :user_id
#
def undo_cleanup_concurrent_column_rename ( table , old_column , new_column , type : nil , batch_column_name : :id )
2022-06-21 17:19:12 +05:30
Gitlab :: Database :: QueryAnalyzers :: RestrictAllowedSchemas . require_ddl_mode!
2021-03-11 19:13:27 +05:30
setup_renamed_column ( __callee__ , table , new_column , old_column , type , batch_column_name )
with_lock_retries do
install_bidirectional_triggers ( table , old_column , new_column )
end
end
2023-07-09 08:55:56 +05:30
# TRUNCATE is a DDL statement (it drops the table and re-creates it), so we want to run the
# migration in DDL mode, but we also don't want to execute it against all schemas because
# it will be prevented by the lock_writes trigger.
#
# For example,
# a `gitlab_main` table on `:gitlab_main` database will be truncated,
# and a `gitlab_main` table on `:gitlab_ci` database will be skipped.
#
# Note Rails already has a truncate_tables, see
# https://github.com/rails/rails/blob/6-1-stable/activerecord/lib/active_record/connection_adapters/abstract/database_statements.rb#L193
def truncate_tables! ( * table_names , connection : self . connection )
table_schemas = Gitlab :: Database :: GitlabSchema . table_schemas! ( table_names )
raise ArgumentError , " `table_names` must resolve to only one `gitlab_schema` " if table_schemas . size != 1
return unless Gitlab :: Database . gitlab_schemas_for_connection ( connection ) . include? ( table_schemas . first )
quoted_tables = table_names . map { | table_name | quote_table_name ( table_name ) } . join ( ', ' )
execute ( " TRUNCATE TABLE #{ quoted_tables } " )
end
2021-03-11 19:13:27 +05:30
private
def setup_renamed_column ( calling_operation , table , old_column , new_column , type , batch_column_name )
if transaction_open?
raise " #{ calling_operation } can not be run inside a transaction "
end
column = columns ( table ) . find { | column | column . name == old_column . to_s }
unless column
raise " Column #{ old_column } does not exist on #{ table } "
end
2023-01-13 00:05:48 +05:30
if column . default_function
raise " #{ calling_operation } does not currently support columns with default functions "
2021-03-11 19:13:27 +05:30
end
unless column_exists? ( table , batch_column_name )
raise " Column #{ batch_column_name } does not exist on #{ table } "
end
check_trigger_permissions! ( table )
unless column_exists? ( table , new_column )
create_column_from ( table , old_column , new_column , type : type , batch_column_name : batch_column_name )
end
end
def teardown_rename_mechanism ( table , old_column , new_column , column_to_remove : )
return unless column_exists? ( table , column_to_remove )
with_lock_retries do
check_trigger_permissions! ( table )
remove_bidirectional_triggers ( table , old_column , new_column )
remove_column ( table , column_to_remove )
end
end
def install_bidirectional_triggers ( table , old_column , new_column )
insert_trigger_name , update_old_trigger_name , update_new_trigger_name =
bidirectional_trigger_names ( table , old_column , new_column )
quoted_table = quote_table_name ( table )
quoted_old = quote_column_name ( old_column )
quoted_new = quote_column_name ( new_column )
create_insert_trigger ( insert_trigger_name , quoted_table , quoted_old , quoted_new )
create_update_trigger ( update_old_trigger_name , quoted_table , quoted_new , quoted_old )
create_update_trigger ( update_new_trigger_name , quoted_table , quoted_old , quoted_new )
end
def remove_bidirectional_triggers ( table , old_column , new_column )
insert_trigger_name , update_old_trigger_name , update_new_trigger_name =
bidirectional_trigger_names ( table , old_column , new_column )
quoted_table = quote_table_name ( table )
drop_trigger ( insert_trigger_name , quoted_table )
drop_trigger ( update_old_trigger_name , quoted_table )
drop_trigger ( update_new_trigger_name , quoted_table )
end
def bidirectional_trigger_names ( table , old_column , new_column )
%w[ insert update_old update_new ] . map do | operation |
'trigger_' + Digest :: SHA256 . hexdigest ( " #{ table } _ #{ old_column } _ #{ new_column } _ #{ operation } " ) . first ( 12 )
end
end
def function_name_for_trigger ( trigger_name )
" function_for_ #{ trigger_name } "
end
def create_insert_trigger ( trigger_name , quoted_table , quoted_old_column , quoted_new_column )
function_name = function_name_for_trigger ( trigger_name )
2023-01-13 00:05:48 +05:30
column = columns ( quoted_table . delete ( '"' ) . to_sym ) . find { | column | column . name == quoted_old_column . delete ( '"' ) }
quoted_default_value = connection . quote ( column . default )
2021-03-11 19:13:27 +05:30
execute ( << ~ SQL )
CREATE OR REPLACE FUNCTION #{function_name}()
RETURNS trigger
LANGUAGE plpgsql
AS $$
BEGIN
2023-01-13 00:05:48 +05:30
IF NEW . #{quoted_old_column} IS NOT DISTINCT FROM #{quoted_default_value} AND NEW.#{quoted_new_column} IS DISTINCT FROM #{quoted_default_value} THEN
2021-03-11 19:13:27 +05:30
NEW . #{quoted_old_column} = NEW.#{quoted_new_column};
END IF ;
2023-01-13 00:05:48 +05:30
IF NEW . #{quoted_new_column} IS NOT DISTINCT FROM #{quoted_default_value} AND NEW.#{quoted_old_column} IS DISTINCT FROM #{quoted_default_value} THEN
2021-03-11 19:13:27 +05:30
NEW . #{quoted_new_column} = NEW.#{quoted_old_column};
END IF ;
RETURN NEW ;
END
$$ ;
DROP TRIGGER IF EXISTS #{trigger_name}
ON #{quoted_table};
CREATE TRIGGER #{trigger_name}
BEFORE INSERT ON #{quoted_table}
FOR EACH ROW EXECUTE FUNCTION #{function_name}();
SQL
end
def create_update_trigger ( trigger_name , quoted_table , quoted_source_column , quoted_target_column )
function_name = function_name_for_trigger ( trigger_name )
execute ( << ~ SQL )
CREATE OR REPLACE FUNCTION #{function_name}()
RETURNS trigger
LANGUAGE plpgsql
AS $$
BEGIN
NEW . #{quoted_target_column} := NEW.#{quoted_source_column};
RETURN NEW ;
END
$$ ;
DROP TRIGGER IF EXISTS #{trigger_name}
ON #{quoted_table};
CREATE TRIGGER #{trigger_name}
BEFORE UPDATE OF #{quoted_source_column} ON #{quoted_table}
FOR EACH ROW EXECUTE FUNCTION #{function_name}();
SQL
end
def drop_trigger ( trigger_name , quoted_table )
function_name = function_name_for_trigger ( trigger_name )
execute ( << ~ SQL )
DROP TRIGGER IF EXISTS #{trigger_name}
ON #{quoted_table};
DROP FUNCTION IF EXISTS #{function_name};
SQL
end
end
end
end
end