debian-mirror-gitlab/lib/gitlab/database/partitioning_migration_helpers/table_management_helpers.rb

# frozen_string_literal: true

module Gitlab
  module Database
    module PartitioningMigrationHelpers
      module TableManagementHelpers
        include ::Gitlab::Database::SchemaHelpers
        include ::Gitlab::Database::DynamicModelHelpers
        include ::Gitlab::Database::MigrationHelpers
        include ::Gitlab::Database::Migrations::BackgroundMigrationHelpers

        # Tables that may be passed to the partitioning helpers in this module; any other table is rejected by
        # `assert_table_is_allowed`.
        ALLOWED_TABLES = %w[audit_events].freeze
        # Scope label handed to `assert_not_in_transaction_block` by the helpers below.
        ERROR_SCOPE = 'table partitioning'

        # Name of the background migration class used when queueing, stealing and tracking backfill jobs.
        MIGRATION_CLASS_NAME = "::#{module_parent_name}::BackfillPartitionedTable"
        # Interval and batch size handed to `queue_background_migration_jobs_by_range_at_intervals`.
        BATCH_INTERVAL = 2.minutes.freeze
        BATCH_SIZE = 50_000

        # Names the positional arguments of a backfill job so they can be read by name instead of by index.
        JobArguments = Struct.new(:start_id, :stop_id, :source_table_name, :partitioned_table_name, :source_column) do
          class << self
            # Builds an instance from the positional argument array of a job.
            def from_array(arguments)
              new(*arguments)
            end
          end
        end

        # Creates a partitioned copy of an existing table, using a RANGE partitioning strategy on a timestamp column.
        # One partition is created per month between the given `min_date` and `max_date`. Also installs a trigger on
        # the original table to copy writes into the partitioned table. To copy over historic data from before creation
        # of the partitioned table, use the `enqueue_partitioning_data_migration` helper in a post-deploy migration.
        #
        # A copy of the original table is required as PG currently does not support partitioning existing tables.
        #
        # Example:
        #
        #   partition_table_by_date :audit_events, :created_at, min_date: Date.new(2020, 1), max_date: Date.new(2020, 6)
        #
        # Options are:
        #   :min_date - a date specifying the lower bounds of the partition range
        #   :max_date - a date specifying the upper bounds of the partitioning range, defaults to today + 1 month
        #
        # Unless min_date is specified explicitly, we default to
        # 1. The minimum value for the partitioning column in the table
        # 2. If no data is present yet, the current month
        def partition_table_by_date(table_name, column_name, min_date: nil, max_date: nil)
          # Preconditions: only allow-listed tables, and never inside an open transaction.
          assert_table_is_allowed(table_name)
          assert_not_in_transaction_block(scope: ERROR_SCOPE)

          max_date ||= Date.today + 1.month

          unless min_date
            # Default to the month of the oldest value in the partitioning column; when the query yields no value,
            # fall back to one month before max_date.
            oldest_month = connection.select_one(<<~SQL)['minimum']
              SELECT date_trunc('MONTH', MIN(#{column_name})) AS minimum
              FROM #{table_name}
            SQL
            min_date = oldest_month || max_date - 1.month
          end

          if min_date >= max_date
            raise "max_date #{max_date} must be greater than min_date #{min_date}"
          end

          primary_key = connection.primary_key(table_name)
          if primary_key.nil?
            raise "primary key not defined for #{table_name}"
          end

          partition_column = find_column_definition(table_name, column_name)
          if partition_column.nil?
            raise "partition column #{column_name} does not exist on #{table_name}"
          end

          partitioned_table_name = make_partitioned_table_name(table_name)

          # The partitioned copy and its partitions are created together in one transaction; the sync trigger is
          # installed afterwards, outside of it.
          transaction do
            create_range_partitioned_copy(table_name, partitioned_table_name, partition_column, primary_key)
            create_daterange_partitions(partitioned_table_name, partition_column.name, min_date, max_date)
          end

          create_trigger_to_sync_tables(table_name, partitioned_table_name, primary_key)
        end

        # Clean up a partitioned copy of an existing table. First, deletes the database function and trigger that were
        # used to copy writes to the partitioned table, then removes the partitioned table (also removing partitions).
        #
        # Example:
        #
        #   drop_partitioned_table_for :audit_events
        #
        def drop_partitioned_table_for(table_name)
          assert_table_is_allowed(table_name)
          assert_not_in_transaction_block(scope: ERROR_SCOPE)

          # The sync trigger is attached to the source table; it is dropped inside `with_lock_retries`.
          with_lock_retries { drop_trigger(table_name, make_sync_trigger_name(table_name)) }

          # With the trigger gone, remove the function it called and finally the partitioned copy itself.
          drop_function(make_sync_function_name(table_name))
          drop_table(make_partitioned_table_name(table_name))
        end

        # Enqueue the background jobs that will backfill data in the partitioned table, by batch-copying records from
        # original table. This helper should be called from a post-deploy migration.
        #
        # Example:
        #
        #   enqueue_partitioning_data_migration :audit_events
        #
        def enqueue_partitioning_data_migration(table_name)
          assert_table_is_allowed(table_name)
          assert_not_in_transaction_block(scope: ERROR_SCOPE)

          # The source table's primary key is passed along as the column the backfill jobs work with.
          enqueue_background_migration(
            table_name,
            make_partitioned_table_name(table_name),
            connection.primary_key(table_name)
          )
        end

        # Removes the tracking records of a previously enqueued partitioning backfill for the given table.
        #
        # Jobs that are already enqueued are not cancelled by this helper; only the information in the database used
        # to track the state of the background migration is deleted. It should be safe to also remove the partitioned
        # table while jobs are still in progress, as the absence of the table will cause them to safely exit.
        #
        # Example:
        #
        #   cleanup_partitioning_data_migration :audit_events
        #
        def cleanup_partitioning_data_migration(table_name)
          assert_table_is_allowed(table_name)
          cleanup_migration_jobs(table_name)
        end

        # Creates all partitions of a HASH-partitioned table inside a single transaction.
        #
        # Partitions are created in the Gitlab::Database::STATIC_PARTITIONS_SCHEMA schema and are named
        # "<table_name>_<remainder>", with the remainder zero-padded so that all partition names have equal length.
        #
        # table_name           - name of the partitioned parent table
        # number_of_partitions - modulus of the hash partitioning, i.e. how many partitions are created
        def create_hash_partitions(table_name, number_of_partitions)
          # Loop invariants, computed once. The padding width is the digit count of the largest remainder; it is
          # derived from integers so it cannot be skewed by floating point rounding.
          schema = Gitlab::Database::STATIC_PARTITIONS_SCHEMA
          width = (number_of_partitions - 1).to_s.length

          transaction do
            (0..number_of_partitions - 1).each do |partition|
              suffix = partition.to_s.rjust(width, '0')
              partition_name = "#{table_name}_#{suffix}"

              execute(<<~SQL)
                CREATE TABLE #{schema}.#{partition_name}
                PARTITION OF #{table_name}
                FOR VALUES WITH (MODULUS #{number_of_partitions}, REMAINDER #{partition});
              SQL
            end
          end
        end

        # Completes the backfill of a partitioned table that was started by a previous BackgroundMigration.
        # This performs two steps, in order:
        #   1. Wait to finish any pending BackgroundMigration jobs for this table that have not succeeded
        #   2. Inline copy the rows of jobs that are still tracked as pending into the partitioned table
        # Afterwards the partitioned table is vacuumed and analyzed with the statement timeout disabled.
        #
        # **NOTE** Migrations using this method cannot be scheduled in the same release as the migration that
        # schedules the background migration (see the `enqueue_partitioning_data_migration` helper), or else the
        # background migration jobs will be force-executed.
        #
        # Raises a RuntimeError when the partitioned table does not exist.
        #
        # Example:
        #
        #   finalize_backfilling_partitioned_table :audit_events
        #
        def finalize_backfilling_partitioned_table(table_name)
          assert_table_is_allowed(table_name)
          assert_not_in_transaction_block(scope: ERROR_SCOPE)

          partitioned_table_name = make_partitioned_table_name(table_name)
          missing_table_message = "could not find partitioned table for #{table_name}, " \
            "this could indicate the previous partitioning migration has been rolled back."
          raise missing_table_message unless table_exists?(partitioned_table_name)

          # Only steal the jobs that were enqueued for this particular source table.
          source_table = table_name.to_s
          Gitlab::BackgroundMigration.steal(MIGRATION_CLASS_NAME) do |job_args|
            JobArguments.from_array(job_args).source_table_name == source_table
          end

          copy_missed_records(table_name, partitioned_table_name, connection.primary_key(table_name))

          disable_statement_timeout { execute("VACUUM FREEZE ANALYZE #{partitioned_table_name}") }
        end

        private

        # Guard for the partitioning helpers: raises a RuntimeError unless the table (String or Symbol) is listed
        # in ALLOWED_TABLES.
        def assert_table_is_allowed(table_name)
          unless ALLOWED_TABLES.include?(table_name.to_s)
            raise "partitioning helpers are in active development, and #{table_name} is not allowed for use, " \
              "for more information please contact the database team"
          end
        end

        # Name of the partitioned copy of `table`: the table name with a "_part" suffix, passed through
        # `tmp_table_name`.
        def make_partitioned_table_name(table)
          suffixed_name = "#{table}_part"
          tmp_table_name(suffixed_name)
        end

        # Name of the database function that syncs writes from `table`, derived via `object_name`.
        def make_sync_function_name(table)
          suffix = 'table_sync_function'
          object_name(table, suffix)
        end

        # Name of the trigger that syncs writes from `table`, derived via `object_name`.
        def make_sync_trigger_name(table)
          suffix = 'table_sync_trigger'
          object_name(table, suffix)
        end

        # Returns the column object of `table` whose name equals `column` (String or Symbol), or nil when there is
        # no such column.
        def find_column_definition(table, column)
          wanted = column.to_s
          connection.columns(table).find { |definition| definition.name == wanted }
        end

        # Creates the RANGE-partitioned copy of the source table, unless a table with that name already exists (in
        # which case a warning is logged and nothing is changed).
        #
        # The copy takes its structure from the source table (LIKE ... INCLUDING ALL EXCLUDING INDEXES). The
        # partition key is first declared as an extra, temporary NOT NULL column so it can be part of the composite
        # primary key; afterwards the copied partition column is removed and the temporary column takes its name.
        def create_range_partitioned_copy(source_table_name, partitioned_table_name, partition_column, primary_key)
          if table_exists?(partitioned_table_name)
            Gitlab::AppLogger.warn "Partitioned table not created because it already exists" \
              " (this may be due to an aborted migration or similar): table_name: #{partitioned_table_name} "
            return
          end

          original_column = partition_column.name
          temporary_column = object_name(original_column, 'partition_key')
          key_columns = [primary_key, temporary_column].join(", ")

          transaction do
            execute(<<~SQL)
              CREATE TABLE #{partitioned_table_name} (
                LIKE #{source_table_name} INCLUDING ALL EXCLUDING INDEXES,
                #{temporary_column} #{partition_column.sql_type} NOT NULL,
                PRIMARY KEY (#{key_columns})
              ) PARTITION BY RANGE (#{temporary_column})
            SQL

            # Swap the copied column for the temporary partition key column.
            remove_column(partitioned_table_name, original_column)
            rename_column(partitioned_table_name, temporary_column, original_column)
            change_column_default(partitioned_table_name, primary_key, nil)

            # Default to int8 primary keys to prevent overflow
            change_column(partitioned_table_name, primary_key, :bigint) if column_of_type?(partitioned_table_name, primary_key, :integer)
          end
        end

        # Whether `column` on `table_name` has the given column `type` (for example :integer).
        #
        # Returns false, instead of failing with NoMethodError on nil, when the column does not exist.
        def column_of_type?(table_name, column, type)
          definition = find_column_definition(table_name, column)
          !definition.nil? && definition.type == type
        end

        # Creates the partitions of a date-range partitioned table: one catch-all partition ("<table>_000000") for
        # everything before the month of `min_date`, followed by one partition per month ("<table>_YYYYMM") up to
        # and including the month of `max_date`. Existing partitions are skipped by `create_range_partition_safely`.
        #
        # `column_name` is accepted but not used by this method.
        def create_daterange_partitions(table_name, column_name, min_date, max_date)
          first_month = min_date.beginning_of_month.to_date
          # Exclusive end: the first day of the month after max_date.
          end_month = max_date.next_month.beginning_of_month.to_date

          create_range_partition_safely(
            "#{table_name}_000000", table_name, 'MINVALUE', to_sql_date_literal(first_month)
          )

          month = first_month
          until month >= end_month
            following_month = month.next_month

            create_range_partition_safely(
              "#{table_name}_#{month.strftime('%Y%m')}",
              table_name,
              to_sql_date_literal(month),
              to_sql_date_literal(following_month)
            )

            month = following_month
          end
        end

        # Formats `date` as YYYY-MM-DD and quotes it through the connection, for use as a partition bound.
        def to_sql_date_literal(date)
          formatted = date.strftime('%Y-%m-%d')
          connection.quote(formatted)
        end

        # Creates the range partition unless its table already exists; in that case only a warning is logged and
        # nil is returned.
        def create_range_partition_safely(partition_name, table_name, lower_bound, upper_bound)
          unless table_exists?(table_for_range_partition(partition_name))
            return create_range_partition(partition_name, table_name, lower_bound, upper_bound)
          end

          Gitlab::AppLogger.warn "Partition not created because it already exists" \
            " (this may be due to an aborted migration or similar): partition_name: #{partition_name}"
          nil
        end

        # Installs the sync function (with a descriptive comment) and the trigger on the source table that calls it,
        # all inside a single `with_lock_retries` block.
        def create_trigger_to_sync_tables(source_table_name, partitioned_table_name, unique_key)
          function_name = make_sync_function_name(source_table_name)
          trigger_name = make_sync_trigger_name(source_table_name)
          function_comment = "Partitioning migration: table sync for #{source_table_name} table"

          with_lock_retries do
            create_sync_function(function_name, partitioned_table_name, unique_key)
            create_comment('FUNCTION', function_name, function_comment)
            create_sync_trigger(source_table_name, trigger_name, function_name)
          end
        end

        # Creates the trigger function `name` that mirrors DELETE, UPDATE and INSERT operations into the partitioned
        # table, matching rows on `unique_key`. When a function with that name already exists, a warning is logged
        # and nothing is created.
        def create_sync_function(name, partitioned_table_name, unique_key)
          if function_exists?(name)
            Gitlab::AppLogger.warn "Partitioning sync function not created because it already exists" \
              " (this may be due to an aborted migration or similar): function name: #{name}"
            return
          end

          # Separator that puts each column of the generated lists on its own line.
          delimiter = ",\n    "
          column_names = connection.columns(partitioned_table_name).map(&:name)
          set_statements = build_set_statements(column_names, unique_key)
          insert_values = column_names.map { |column| "NEW.#{column}" }

          create_trigger_function(name, replace: false) do
            <<~SQL
              IF (TG_OP = 'DELETE') THEN
                DELETE FROM #{partitioned_table_name} where #{unique_key} = OLD.#{unique_key};
              ELSIF (TG_OP = 'UPDATE') THEN
                UPDATE #{partitioned_table_name}
                SET #{set_statements.join(delimiter)}
                WHERE #{partitioned_table_name}.#{unique_key} = NEW.#{unique_key};
              ELSIF (TG_OP = 'INSERT') THEN
                INSERT INTO #{partitioned_table_name} (#{column_names.join(delimiter)})
                VALUES (#{insert_values.join(delimiter)});
              END IF;
              RETURN NULL;
            SQL
          end
        end

        # Builds the "column = NEW.column" assignments for the UPDATE branch of the sync function, one per column,
        # leaving out the unique key column.
        #
        # Names are compared as Strings, so the key is excluded whether it is given as a String or as a Symbol.
        def build_set_statements(column_names, unique_key)
          key_name = unique_key.to_s

          column_names
            .reject { |column| column.to_s == key_name }
            .map { |column| "#{column} = NEW.#{column}" }
        end

        # Creates the AFTER INSERT OR UPDATE OR DELETE trigger on `table_name` that calls `function_name`, unless a
        # trigger with that name already exists; in that case only a warning is logged and nil is returned.
        def create_sync_trigger(table_name, trigger_name, function_name)
          unless trigger_exists?(table_name, trigger_name)
            return create_trigger(table_name, trigger_name, function_name, fires: 'AFTER INSERT OR UPDATE OR DELETE')
          end

          Gitlab::AppLogger.warn "Partitioning sync trigger not created because it already exists" \
            " (this may be due to an aborted migration or similar): trigger name: #{trigger_name}"
          nil
        end

        # Queues tracked background migration jobs over the source table, in batches of BATCH_SIZE spaced by
        # BATCH_INTERVAL. Each job additionally receives the source table name (as a String), the partitioned table
        # name and the source column.
        def enqueue_background_migration(source_table_name, partitioned_table_name, source_column)
          extra_job_arguments = [source_table_name.to_s, partitioned_table_name, source_column]

          queue_background_migration_jobs_by_range_at_intervals(
            define_batchable_model(source_table_name),
            MIGRATION_CLASS_NAME,
            BATCH_INTERVAL,
            batch_size: BATCH_SIZE,
            other_job_arguments: extra_job_arguments,
            track_jobs: true
          )
        end

        # Deletes the BackgroundMigrationJob records selected by `for_partitioning_migration` for this migration
        # class and table.
        def cleanup_migration_jobs(table_name)
          tracking_records = ::Gitlab::Database::BackgroundMigrationJob
            .for_partitioning_migration(MIGRATION_CLASS_NAME, table_name)

          tracking_records.delete_all
        end

        # Runs the backfill inline for every job of this migration and source table that is still tracked as
        # pending. Raises a RuntimeError as soon as an inline run does not report a positive count.
        def copy_missed_records(source_table_name, partitioned_table_name, source_column)
          backfill_table = BackfillPartitionedTable.new
          pending_jobs = ::Gitlab::Database::BackgroundMigrationJob
            .pending
            .for_partitioning_migration(MIGRATION_CLASS_NAME, source_table_name)

          pending_jobs.each_batch do |batch|
            batch.each do |tracking_record|
              job = JobArguments.from_array(tracking_record.arguments)
              first_id = job.start_id
              last_id = job.stop_id

              say("Backfilling data into partitioned table for ids from #{first_id} to #{last_id}")
              updated_count = backfill_table.perform(
                first_id, last_id, source_table_name, partitioned_table_name, source_column
              )

              next if updated_count > 0

              raise "failed to update tracking record for ids from #{first_id} to #{last_id}"
            end
          end
        end
      end
    end
  end
end
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`# frozen_string_literal: true`

			`module Gitlab`
			`module Database`
			`module PartitioningMigrationHelpers`
			`module TableManagementHelpers`
			`include ::Gitlab::Database::SchemaHelpers`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`include ::Gitlab::Database::DynamicModelHelpers`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`include ::Gitlab::Database::MigrationHelpers`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`include ::Gitlab::Database::Migrations::BackgroundMigrationHelpers`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`ALLOWED_TABLES = %w[audit_events].freeze`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`ERROR_SCOPE = 'table partitioning'`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`MIGRATION_CLASS_NAME = "::#{module_parent_name}::BackfillPartitionedTable"`
			`BATCH_INTERVAL = 2.minutes.freeze`
			`BATCH_SIZE = 50_000`

New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`JobArguments = Struct.new(:start_id, :stop_id, :source_table_name, :partitioned_table_name, :source_column) do`
			`def self.from_array(arguments)`
			`self.new(*arguments)`
			`end`
			`end`

New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`# Creates a partitioned copy of an existing table, using a RANGE partitioning strategy on a timestamp column.`
New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			# One partition is created per month between the given `min_date` and `max_date`. Also installs a trigger on
			`# the original table to copy writes into the partitioned table. To copy over historic data from before creation`
			# of the partitioned table, use the `enqueue_partitioning_data_migration` helper in a post-deploy migration.
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`#`
			`# A copy of the original table is required as PG currently does not support partitioning existing tables.`
			`#`
			`# Example:`
			`#`
			`# partition_table_by_date :audit_events, :created_at, min_date: Date.new(2020, 1), max_date: Date.new(2020, 6)`
			`#`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`# Options are:`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`# :min_date - a date specifying the lower bounds of the partition range`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`# :max_date - a date specifying the upper bounds of the partitioning range, defaults to today + 1 month`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`#`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`# Unless min_date is specified explicitly, we default to`
			`# 1. The minimum value for the partitioning column in the table`
			`# 2. If no data is present yet, the current month`
			`def partition_table_by_date(table_name, column_name, min_date: nil, max_date: nil)`
			`assert_table_is_allowed(table_name)`

New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`assert_not_in_transaction_block(scope: ERROR_SCOPE)`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`max_date \|\|= Date.today + 1.month`

			`min_date \|\|= connection.select_one(<<~SQL)['minimum'] \|\| max_date - 1.month`
			`SELECT date_trunc('MONTH', MIN(#{column_name})) AS minimum`
			`FROM #{table_name}`
			`SQL`

New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`raise "max_date #{max_date} must be greater than min_date #{min_date}" if min_date >= max_date`

			`primary_key = connection.primary_key(table_name)`
			`raise "primary key not defined for #{table_name}" if primary_key.nil?`

			`partition_column = find_column_definition(table_name, column_name)`
			`raise "partition column #{column_name} does not exist on #{table_name}" if partition_column.nil?`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`partitioned_table_name = make_partitioned_table_name(table_name)`

New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`transaction do`
			`create_range_partitioned_copy(table_name, partitioned_table_name, partition_column, primary_key)`
			`create_daterange_partitions(partitioned_table_name, partition_column.name, min_date, max_date)`
			`end`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`create_trigger_to_sync_tables(table_name, partitioned_table_name, primary_key)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`end`

New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`# Clean up a partitioned copy of an existing table. First, deletes the database function and trigger that were`
			`# used to copy writes to the partitioned table, then removes the partitioned table (also removing partitions).`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`#`
			`# Example:`
			`#`
			`# drop_partitioned_table_for :audit_events`
			`#`
			`def drop_partitioned_table_for(table_name)`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`assert_table_is_allowed(table_name)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`assert_not_in_transaction_block(scope: ERROR_SCOPE)`

			`with_lock_retries do`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`trigger_name = make_sync_trigger_name(table_name)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`drop_trigger(table_name, trigger_name)`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`function_name = make_sync_function_name(table_name)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`drop_function(function_name)`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`partitioned_table_name = make_partitioned_table_name(table_name)`
			`drop_table(partitioned_table_name)`
			`end`

New upstream version 13.3.8 2020-10-24 23:57:45 +05:30			`# Enqueue the background jobs that will backfill data in the partitioned table, by batch-copying records from`
			`# original table. This helper should be called from a post-deploy migration.`
			`#`
			`# Example:`
			`#`
			`# enqueue_partitioning_data_migration :audit_events`
			`#`
			`def enqueue_partitioning_data_migration(table_name)`
			`assert_table_is_allowed(table_name)`

			`assert_not_in_transaction_block(scope: ERROR_SCOPE)`

			`partitioned_table_name = make_partitioned_table_name(table_name)`
			`primary_key = connection.primary_key(table_name)`
			`enqueue_background_migration(table_name, partitioned_table_name, primary_key)`
			`end`

			`# Cleanup a previously enqueued background migration to copy data into a partitioned table. This will not`
			`# prevent the enqueued jobs from executing, but instead cleans up information in the database used to track the`
			`# state of the background migration. It should be safe to also remove the partitioned table even if the`
			`# background jobs are still in-progress, as the absence of the table will cause them to safely exit.`
			`#`
			`# Example:`
			`#`
			`# cleanup_partitioning_data_migration :audit_events`
			`#`
			`def cleanup_partitioning_data_migration(table_name)`
			`assert_table_is_allowed(table_name)`

			`cleanup_migration_jobs(table_name)`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def create_hash_partitions(table_name, number_of_partitions)`
			`transaction do`
			`(0..number_of_partitions - 1).each do \|partition\|`
			`decimals = Math.log10(number_of_partitions).ceil`
			`suffix = "%0#{decimals}d" % partition`
			`partition_name = "#{table_name}_#{suffix}"`
			`schema = Gitlab::Database::STATIC_PARTITIONS_SCHEMA`

			`execute(<<~SQL)`
			`CREATE TABLE #{schema}.#{partition_name}`
			`PARTITION OF #{table_name}`
			`FOR VALUES WITH (MODULUS #{number_of_partitions}, REMAINDER #{partition});`
			`SQL`
			`end`
			`end`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`end`

New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`# Executes cleanup tasks from a previous BackgroundMigration to backfill a partitioned table by finishing`
			`# pending jobs and performing a final data synchronization.`
			`# This performs two steps:`
			`# 1. Wait to finish any pending BackgroundMigration jobs that have not succeeded`
			`# 2. Inline copy any missed rows from the original table to the partitioned table`
			`#`
			`# NOTE Migrations using this method cannot be scheduled in the same release as the migration that`
			# schedules the background migration using the `enqueue_background_migration` helper, or else the
			`# background migration jobs will be force-executed.`
			`#`
			`# Example:`
			`#`
			`# finalize_backfilling_partitioned_table :audit_events`
			`#`
			`def finalize_backfilling_partitioned_table(table_name)`
			`assert_table_is_allowed(table_name)`
			`assert_not_in_transaction_block(scope: ERROR_SCOPE)`

			`partitioned_table_name = make_partitioned_table_name(table_name)`
			`unless table_exists?(partitioned_table_name)`
			`raise "could not find partitioned table for #{table_name}, " \`
			`"this could indicate the previous partitioning migration has been rolled back."`
			`end`

			`Gitlab::BackgroundMigration.steal(MIGRATION_CLASS_NAME) do \|raw_arguments\|`
			`JobArguments.from_array(raw_arguments).source_table_name == table_name.to_s`
			`end`

			`primary_key = connection.primary_key(table_name)`
			`copy_missed_records(table_name, partitioned_table_name, primary_key)`

			`disable_statement_timeout do`
			`execute("VACUUM FREEZE ANALYZE #{partitioned_table_name}")`
			`end`
			`end`

New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`private`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def assert_table_is_allowed(table_name)`
			`return if ALLOWED_TABLES.include?(table_name.to_s)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`raise "partitioning helpers are in active development, and #{table_name} is not allowed for use, " \`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`"for more information please contact the database team"`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def make_partitioned_table_name(table)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`tmp_table_name("#{table}_part")`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def make_sync_function_name(table)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`object_name(table, 'table_sync_function')`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def make_sync_trigger_name(table)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`object_name(table, 'table_sync_trigger')`
			`end`

			`def find_column_definition(table, column)`
			`connection.columns(table).find { \|c\| c.name == column.to_s }`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def create_range_partitioned_copy(source_table_name, partitioned_table_name, partition_column, primary_key)`
			`if table_exists?(partitioned_table_name)`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`Gitlab::AppLogger.warn "Partitioned table not created because it already exists" \`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`" (this may be due to an aborted migration or similar): table_name: #{partitioned_table_name} "`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`return`
			`end`

			`tmp_column_name = object_name(partition_column.name, 'partition_key')`
			`transaction do`
			`execute(<<~SQL)`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`CREATE TABLE #{partitioned_table_name} (`
			`LIKE #{source_table_name} INCLUDING ALL EXCLUDING INDEXES,`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`#{tmp_column_name} #{partition_column.sql_type} NOT NULL,`
			`PRIMARY KEY (#{[primary_key, tmp_column_name].join(", ")})`
			`) PARTITION BY RANGE (#{tmp_column_name})`
			`SQL`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`remove_column(partitioned_table_name, partition_column.name)`
			`rename_column(partitioned_table_name, tmp_column_name, partition_column.name)`
			`change_column_default(partitioned_table_name, primary_key, nil)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`if column_of_type?(partitioned_table_name, primary_key, :integer)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`# Default to int8 primary keys to prevent overflow`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`change_column(partitioned_table_name, primary_key, :bigint)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`end`
			`end`
			`end`

			`def column_of_type?(table_name, column, type)`
			`find_column_definition(table_name, column).type == type`
			`end`

			`def create_daterange_partitions(table_name, column_name, min_date, max_date)`
			`min_date = min_date.beginning_of_month.to_date`
			`max_date = max_date.next_month.beginning_of_month.to_date`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`upper_bound = to_sql_date_literal(min_date)`
			`create_range_partition_safely("#{table_name}_000000", table_name, 'MINVALUE', upper_bound)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
			`while min_date < max_date`
			`partition_name = "#{table_name}_#{min_date.strftime('%Y%m')}"`
			`next_date = min_date.next_month`
			`lower_bound = to_sql_date_literal(min_date)`
			`upper_bound = to_sql_date_literal(next_date)`

			`create_range_partition_safely(partition_name, table_name, lower_bound, upper_bound)`
			`min_date = next_date`
			`end`
			`end`

			`def to_sql_date_literal(date)`
			`connection.quote(date.strftime('%Y-%m-%d'))`
			`end`

			`def create_range_partition_safely(partition_name, table_name, lower_bound, upper_bound)`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`if table_exists?(table_for_range_partition(partition_name))`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`Gitlab::AppLogger.warn "Partition not created because it already exists" \`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`" (this may be due to an aborted migration or similar): partition_name: #{partition_name}"`
			`return`
			`end`

			`create_range_partition(partition_name, table_name, lower_bound, upper_bound)`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def create_trigger_to_sync_tables(source_table_name, partitioned_table_name, unique_key)`
			`function_name = make_sync_function_name(source_table_name)`
			`trigger_name = make_sync_trigger_name(source_table_name)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
			`with_lock_retries do`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`create_sync_function(function_name, partitioned_table_name, unique_key)`
			`create_comment('FUNCTION', function_name, "Partitioning migration: table sync for #{source_table_name} table")`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`create_sync_trigger(source_table_name, trigger_name, function_name)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`end`
			`end`

New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`def create_sync_function(name, partitioned_table_name, unique_key)`
			`if function_exists?(name)`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`Gitlab::AppLogger.warn "Partitioning sync function not created because it already exists" \`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`" (this may be due to an aborted migration or similar): function name: #{name}"`
			`return`
			`end`

New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`delimiter = ",\n "`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`column_names = connection.columns(partitioned_table_name).map(&:name)`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`set_statements = build_set_statements(column_names, unique_key)`
			`insert_values = column_names.map { \|name\| "NEW.#{name}" }`

			`create_trigger_function(name, replace: false) do`
			`<<~SQL`
			`IF (TG_OP = 'DELETE') THEN`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`DELETE FROM #{partitioned_table_name} where #{unique_key} = OLD.#{unique_key};`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`ELSIF (TG_OP = 'UPDATE') THEN`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`UPDATE #{partitioned_table_name}`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`SET #{set_statements.join(delimiter)}`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`WHERE #{partitioned_table_name}.#{unique_key} = NEW.#{unique_key};`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`ELSIF (TG_OP = 'INSERT') THEN`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`INSERT INTO #{partitioned_table_name} (#{column_names.join(delimiter)})`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`VALUES (#{insert_values.join(delimiter)});`
			`END IF;`
			`RETURN NULL;`
			`SQL`
			`end`
			`end`

			`def build_set_statements(column_names, unique_key)`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`column_names.reject { \|name\| name == unique_key }.map { \|name\| "#{name} = NEW.#{name}" }`
			`end`

			`def create_sync_trigger(table_name, trigger_name, function_name)`
			`if trigger_exists?(table_name, trigger_name)`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`Gitlab::AppLogger.warn "Partitioning sync trigger not created because it already exists" \`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`" (this may be due to an aborted migration or similar): trigger name: #{trigger_name}"`
			`return`
			`end`

			`create_trigger(table_name, trigger_name, function_name, fires: 'AFTER INSERT OR UPDATE OR DELETE')`
			`end`

New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`def enqueue_background_migration(source_table_name, partitioned_table_name, source_column)`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`source_model = define_batchable_model(source_table_name)`

			`queue_background_migration_jobs_by_range_at_intervals(`
			`source_model,`
			`MIGRATION_CLASS_NAME,`
			`BATCH_INTERVAL,`
			`batch_size: BATCH_SIZE,`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30			`other_job_arguments: [source_table_name.to_s, partitioned_table_name, source_column],`
New upstream version 13.2.1 2020-07-28 23:09:34 +05:30			`track_jobs: true)`
			`end`

			`def cleanup_migration_jobs(table_name)`
			`::Gitlab::Database::BackgroundMigrationJob.for_partitioning_migration(MIGRATION_CLASS_NAME, table_name).delete_all`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`end`
New upstream version 13.4.6 2020-11-24 15:15:51 +05:30
			`def copy_missed_records(source_table_name, partitioned_table_name, source_column)`
			`backfill_table = BackfillPartitionedTable.new`
			`relation = ::Gitlab::Database::BackgroundMigrationJob.pending`
			`.for_partitioning_migration(MIGRATION_CLASS_NAME, source_table_name)`

			`relation.each_batch do \|batch\|`
			`batch.each do \|pending_migration_job\|`
			`job_arguments = JobArguments.from_array(pending_migration_job.arguments)`
			`start_id = job_arguments.start_id`
			`stop_id = job_arguments.stop_id`

			`say("Backfilling data into partitioned table for ids from #{start_id} to #{stop_id}")`
			`job_updated_count = backfill_table.perform(start_id, stop_id, source_table_name,`
			`partitioned_table_name, source_column)`

			`unless job_updated_count > 0`
			`raise "failed to update tracking record for ids from #{start_id} to #{stop_id}"`
			`end`
			`end`
			`end`
			`end`
New upstream version 13.1.0 2020-06-23 00:09:42 +05:30			`end`
			`end`
			`end`
			`end`