385 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Ruby
		
	
	
	
			
		
		
	
	
			385 lines
		
	
	
		
			13 KiB
		
	
	
	
		
			Ruby
		
	
	
	
| # frozen_string_literal: true
 | ||
| 
 | ||
| module Gitlab
 | ||
|   module Database
 | ||
|     # Minimum PostgreSQL version requirement per documentation:
 | ||
|     # https://docs.gitlab.com/ee/install/requirements.html#postgresql-requirements
 | ||
|     MINIMUM_POSTGRES_VERSION = 11
 | ||
| 
 | ||
|     # Upcoming PostgreSQL version requirements
 | ||
|     # Allows a soft warning about an upcoming minimum version requirement
 | ||
|     # so administrators can prepare to upgrade
 | ||
|     UPCOMING_POSTGRES_VERSION_DETAILS = {
 | ||
|       gl_version: '13.6.0',
 | ||
|       gl_version_date: 'November 22, 2020',
 | ||
|       pg_version_minimum: 12,
 | ||
|       url: 'https://gitlab.com/groups/gitlab-org/-/epics/2374'
 | ||
|     }.freeze
 | ||
| 
 | ||
|     # Specifies the maximum number of days in advance to display a notice
 | ||
|     # regarding an upcoming PostgreSQL version deprecation.
 | ||
|     DEPRECATION_WINDOW_DAYS = 90
 | ||
| 
 | ||
|     # https://www.postgresql.org/docs/9.2/static/datatype-numeric.html
 | ||
|     MAX_INT_VALUE = 2147483647
 | ||
| 
 | ||
|     # The max value between MySQL's TIMESTAMP and PostgreSQL's timestampz:
 | ||
|     # https://www.postgresql.org/docs/9.1/static/datatype-datetime.html
 | ||
|     # https://dev.mysql.com/doc/refman/5.7/en/datetime.html
 | ||
|     # FIXME: this should just be the max value of timestampz
 | ||
|     MAX_TIMESTAMP_VALUE = Time.at((1 << 31) - 1).freeze
 | ||
| 
 | ||
|     # The maximum number of characters for text fields, to avoid DoS attacks via parsing huge text fields
 | ||
|     # https://gitlab.com/gitlab-org/gitlab-foss/issues/61974
 | ||
|     MAX_TEXT_SIZE_LIMIT = 1_000_000
 | ||
| 
 | ||
|     # Minimum schema version from which migrations are supported
 | ||
|     # Migrations before this version may have been removed
 | ||
|     MIN_SCHEMA_VERSION = 20190506135400
 | ||
|     MIN_SCHEMA_GITLAB_VERSION = '11.11.0'
 | ||
| 
 | ||
|     # Schema we store dynamically managed partitions in (e.g. for time partitioning)
 | ||
|     DYNAMIC_PARTITIONS_SCHEMA = :gitlab_partitions_dynamic
 | ||
| 
 | ||
|     # Schema we store static partitions in (e.g. for hash partitioning)
 | ||
|     STATIC_PARTITIONS_SCHEMA = :gitlab_partitions_static
 | ||
| 
 | ||
|     # This is an extensive list of postgres schemas owned by GitLab
 | ||
|     # It does not include the default public schema
 | ||
|     EXTRA_SCHEMAS = [DYNAMIC_PARTITIONS_SCHEMA, STATIC_PARTITIONS_SCHEMA].freeze
 | ||
| 
 | ||
|     def self.config
 | ||
|       ActiveRecord::Base.configurations[Rails.env]
 | ||
|     end
 | ||
| 
 | ||
|     def self.username
 | ||
|       config['username'] || ENV['USER']
 | ||
|     end
 | ||
| 
 | ||
|     def self.database_name
 | ||
|       config['database']
 | ||
|     end
 | ||
| 
 | ||
|     def self.adapter_name
 | ||
|       config['adapter']
 | ||
|     end
 | ||
| 
 | ||
|     def self.human_adapter_name
 | ||
|       if postgresql?
 | ||
|         'PostgreSQL'
 | ||
|       else
 | ||
|         'Unknown'
 | ||
|       end
 | ||
|     end
 | ||
| 
 | ||
|     # @deprecated
 | ||
|     def self.postgresql?
 | ||
|       adapter_name.casecmp('postgresql') == 0
 | ||
|     end
 | ||
| 
 | ||
|     def self.read_only?
 | ||
|       false
 | ||
|     end
 | ||
| 
 | ||
|     def self.read_write?
 | ||
|       !self.read_only?
 | ||
|     end
 | ||
| 
 | ||
|     # Check whether the underlying database is in read-only mode
 | ||
|     def self.db_read_only?
 | ||
|       pg_is_in_recovery =
 | ||
|         ActiveRecord::Base
 | ||
|           .connection
 | ||
|           .execute('SELECT pg_is_in_recovery()')
 | ||
|           .first
 | ||
|           .fetch('pg_is_in_recovery')
 | ||
| 
 | ||
|       Gitlab::Utils.to_boolean(pg_is_in_recovery)
 | ||
|     end
 | ||
| 
 | ||
|     def self.db_read_write?
 | ||
|       !self.db_read_only?
 | ||
|     end
 | ||
| 
 | ||
|     def self.version
 | ||
|       @version ||= database_version.match(/\A(?:PostgreSQL |)([^\s]+).*\z/)[1]
 | ||
|     end
 | ||
| 
 | ||
|     def self.postgresql_9_or_less?
 | ||
|       version.to_f < 10
 | ||
|     end
 | ||
| 
 | ||
|     def self.postgresql_minimum_supported_version?
 | ||
|       version.to_f >= MINIMUM_POSTGRES_VERSION
 | ||
|     end
 | ||
| 
 | ||
|     def self.postgresql_upcoming_deprecation?
 | ||
|       version.to_f < UPCOMING_POSTGRES_VERSION_DETAILS[:pg_version_minimum]
 | ||
|     end
 | ||
| 
 | ||
|     def self.days_until_deprecation
 | ||
|       (
 | ||
|         Date.parse(UPCOMING_POSTGRES_VERSION_DETAILS[:gl_version_date]) -
 | ||
|         Date.today
 | ||
|       ).to_i
 | ||
|     end
 | ||
|     private_class_method :days_until_deprecation
 | ||
| 
 | ||
|     def self.within_deprecation_notice_window?
 | ||
|       days_until_deprecation <= DEPRECATION_WINDOW_DAYS
 | ||
|     end
 | ||
| 
 | ||
|     def self.check_postgres_version_and_print_warning
 | ||
|       return if Gitlab::Database.postgresql_minimum_supported_version?
 | ||
|       return if Gitlab::Runtime.rails_runner?
 | ||
| 
 | ||
|       Kernel.warn ERB.new(Rainbow.new.wrap(<<~EOS).red).result
 | ||
| 
 | ||
|                   ██     ██  █████  ██████  ███    ██ ██ ███    ██  ██████ 
 | ||
|                   ██     ██ ██   ██ ██   ██ ████   ██ ██ ████   ██ ██      
 | ||
|                   ██  █  ██ ███████ ██████  ██ ██  ██ ██ ██ ██  ██ ██   ███ 
 | ||
|                   ██ ███ ██ ██   ██ ██   ██ ██  ██ ██ ██ ██  ██ ██ ██    ██ 
 | ||
|                    ███ ███  ██   ██ ██   ██ ██   ████ ██ ██   ████  ██████  
 | ||
| 
 | ||
|         ******************************************************************************
 | ||
|           You are using PostgreSQL <%= Gitlab::Database.version %>, but PostgreSQL >= <%= Gitlab::Database::MINIMUM_POSTGRES_VERSION %>
 | ||
|           is required for this version of GitLab.
 | ||
|           <% if Rails.env.development? || Rails.env.test? %>
 | ||
|           If using gitlab-development-kit, please find the relevant steps here:
 | ||
|             https://gitlab.com/gitlab-org/gitlab-development-kit/-/blob/master/doc/howto/postgresql.md#upgrade-postgresql
 | ||
|           <% end %>
 | ||
|           Please upgrade your environment to a supported PostgreSQL version, see
 | ||
|           https://docs.gitlab.com/ee/install/requirements.html#database for details.
 | ||
|         ******************************************************************************
 | ||
|       EOS
 | ||
|     rescue ActiveRecord::ActiveRecordError, PG::Error
 | ||
|       # ignore - happens when Rake tasks yet have to create a database, e.g. for testing
 | ||
|     end
 | ||
| 
 | ||
|     # map some of the function names that changed between PostgreSQL 9 and 10
 | ||
|     # https://wiki.postgresql.org/wiki/New_in_postgres_10
 | ||
|     def self.pg_wal_lsn_diff
 | ||
|       Gitlab::Database.postgresql_9_or_less? ? 'pg_xlog_location_diff' : 'pg_wal_lsn_diff'
 | ||
|     end
 | ||
| 
 | ||
|     def self.pg_current_wal_insert_lsn
 | ||
|       Gitlab::Database.postgresql_9_or_less? ? 'pg_current_xlog_insert_location' : 'pg_current_wal_insert_lsn'
 | ||
|     end
 | ||
| 
 | ||
|     def self.pg_last_wal_receive_lsn
 | ||
|       Gitlab::Database.postgresql_9_or_less? ? 'pg_last_xlog_receive_location' : 'pg_last_wal_receive_lsn'
 | ||
|     end
 | ||
| 
 | ||
|     def self.pg_last_wal_replay_lsn
 | ||
|       Gitlab::Database.postgresql_9_or_less? ? 'pg_last_xlog_replay_location' : 'pg_last_wal_replay_lsn'
 | ||
|     end
 | ||
| 
 | ||
|     def self.pg_last_xact_replay_timestamp
 | ||
|       'pg_last_xact_replay_timestamp'
 | ||
|     end
 | ||
| 
 | ||
|     def self.nulls_last_order(field, direction = 'ASC')
 | ||
|       Arel.sql("#{field} #{direction} NULLS LAST")
 | ||
|     end
 | ||
| 
 | ||
|     def self.nulls_first_order(field, direction = 'ASC')
 | ||
|       Arel.sql("#{field} #{direction} NULLS FIRST")
 | ||
|     end
 | ||
| 
 | ||
|     def self.random
 | ||
|       "RANDOM()"
 | ||
|     end
 | ||
| 
 | ||
|     def self.true_value
 | ||
|       "'t'"
 | ||
|     end
 | ||
| 
 | ||
|     def self.false_value
 | ||
|       "'f'"
 | ||
|     end
 | ||
| 
 | ||
|     def self.with_connection_pool(pool_size)
 | ||
|       pool = create_connection_pool(pool_size)
 | ||
| 
 | ||
|       begin
 | ||
|         yield(pool)
 | ||
|       ensure
 | ||
|         pool.disconnect!
 | ||
|       end
 | ||
|     end
 | ||
| 
 | ||
|     # Bulk inserts a number of rows into a table, optionally returning their
 | ||
|     # IDs.
 | ||
|     #
 | ||
|     # table - The name of the table to insert the rows into.
 | ||
|     # rows - An Array of Hash instances, each mapping the columns to their
 | ||
|     #        values.
 | ||
|     # return_ids - When set to true the return value will be an Array of IDs of
 | ||
|     #              the inserted rows
 | ||
|     # disable_quote - A key or an Array of keys to exclude from quoting (You
 | ||
|     #                 become responsible for protection from SQL injection for
 | ||
|     #                 these keys!)
 | ||
|     # on_conflict - Defines an upsert. Values can be: :disabled (default) or
 | ||
|     #               :do_nothing
 | ||
|     def self.bulk_insert(table, rows, return_ids: false, disable_quote: [], on_conflict: nil)
 | ||
|       return if rows.empty?
 | ||
| 
 | ||
|       keys = rows.first.keys
 | ||
|       columns = keys.map { |key| connection.quote_column_name(key) }
 | ||
| 
 | ||
|       disable_quote = Array(disable_quote).to_set
 | ||
|       tuples = rows.map do |row|
 | ||
|         keys.map do |k|
 | ||
|           disable_quote.include?(k) ? row[k] : connection.quote(row[k])
 | ||
|         end
 | ||
|       end
 | ||
| 
 | ||
|       sql = <<-EOF
 | ||
|         INSERT INTO #{table} (#{columns.join(', ')})
 | ||
|         VALUES #{tuples.map { |tuple| "(#{tuple.join(', ')})" }.join(', ')}
 | ||
|       EOF
 | ||
| 
 | ||
|       sql = "#{sql} ON CONFLICT DO NOTHING" if on_conflict == :do_nothing
 | ||
| 
 | ||
|       sql = "#{sql} RETURNING id" if return_ids
 | ||
| 
 | ||
|       result = connection.execute(sql)
 | ||
| 
 | ||
|       if return_ids
 | ||
|         result.values.map { |tuple| tuple[0].to_i }
 | ||
|       else
 | ||
|         []
 | ||
|       end
 | ||
|     end
 | ||
| 
 | ||
|     def self.sanitize_timestamp(timestamp)
 | ||
|       MAX_TIMESTAMP_VALUE > timestamp ? timestamp : MAX_TIMESTAMP_VALUE.dup
 | ||
|     end
 | ||
| 
 | ||
|     # pool_size - The size of the DB pool.
 | ||
|     # host - An optional host name to use instead of the default one.
 | ||
|     def self.create_connection_pool(pool_size, host = nil, port = nil)
 | ||
|       env = Rails.env
 | ||
|       original_config = ActiveRecord::Base.configurations.to_h
 | ||
| 
 | ||
|       env_config = original_config[env].merge('pool' => pool_size)
 | ||
|       env_config['host'] = host if host
 | ||
|       env_config['port'] = port if port
 | ||
| 
 | ||
|       config = ActiveRecord::DatabaseConfigurations.new(
 | ||
|         original_config.merge(env => env_config)
 | ||
|       )
 | ||
| 
 | ||
|       spec =
 | ||
|         ActiveRecord::
 | ||
|           ConnectionAdapters::
 | ||
|           ConnectionSpecification::Resolver.new(config).spec(env.to_sym)
 | ||
| 
 | ||
|       ActiveRecord::ConnectionAdapters::ConnectionPool.new(spec)
 | ||
|     end
 | ||
| 
 | ||
|     def self.connection
 | ||
|       ActiveRecord::Base.connection
 | ||
|     end
 | ||
|     private_class_method :connection
 | ||
| 
 | ||
|     def self.cached_column_exists?(table_name, column_name)
 | ||
|       connection.schema_cache.columns_hash(table_name).has_key?(column_name.to_s)
 | ||
|     end
 | ||
| 
 | ||
|     def self.cached_table_exists?(table_name)
 | ||
|       exists? && connection.schema_cache.data_source_exists?(table_name)
 | ||
|     end
 | ||
| 
 | ||
|     def self.database_version
 | ||
|       row = connection.execute("SELECT VERSION()").first
 | ||
| 
 | ||
|       row['version']
 | ||
|     end
 | ||
| 
 | ||
|     def self.exists?
 | ||
|       connection
 | ||
| 
 | ||
|       true
 | ||
|     rescue
 | ||
|       false
 | ||
|     end
 | ||
| 
 | ||
|     private_class_method :database_version
 | ||
| 
 | ||
|     def self.add_post_migrate_path_to_rails(force: false)
 | ||
|       return if ENV['SKIP_POST_DEPLOYMENT_MIGRATIONS'] && !force
 | ||
| 
 | ||
|       Rails.application.config.paths['db'].each do |db_path|
 | ||
|         path = Rails.root.join(db_path, 'post_migrate').to_s
 | ||
| 
 | ||
|         unless Rails.application.config.paths['db/migrate'].include? path
 | ||
|           Rails.application.config.paths['db/migrate'] << path
 | ||
| 
 | ||
|           # Rails memoizes migrations at certain points where it won't read the above
 | ||
|           # path just yet. As such we must also update the following list of paths.
 | ||
|           ActiveRecord::Migrator.migrations_paths << path
 | ||
|         end
 | ||
|       end
 | ||
|     end
 | ||
| 
 | ||
|     # inside_transaction? will return true if the caller is running within a transaction. Handles special cases
 | ||
|     # when running inside a test environment, where tests may be wrapped in transactions
 | ||
|     def self.inside_transaction?
 | ||
|       if Rails.env.test?
 | ||
|         ActiveRecord::Base.connection.open_transactions > open_transactions_baseline
 | ||
|       else
 | ||
|         ActiveRecord::Base.connection.open_transactions > 0
 | ||
|       end
 | ||
|     end
 | ||
| 
 | ||
|     # These methods that access @open_transactions_baseline are not thread-safe.
 | ||
|     # These are fine though because we only call these in RSpec's main thread. If we decide to run
 | ||
|     # specs multi-threaded, we would need to use something like ThreadGroup to keep track of this value
 | ||
|     def self.set_open_transactions_baseline
 | ||
|       @open_transactions_baseline = ActiveRecord::Base.connection.open_transactions
 | ||
|     end
 | ||
| 
 | ||
|     def self.reset_open_transactions_baseline
 | ||
|       @open_transactions_baseline = 0
 | ||
|     end
 | ||
| 
 | ||
|     def self.open_transactions_baseline
 | ||
|       @open_transactions_baseline ||= 0
 | ||
|     end
 | ||
|     private_class_method :open_transactions_baseline
 | ||
| 
 | ||
|     # Monkeypatch rails with upgraded database observability
 | ||
|     def self.install_monkey_patches
 | ||
|       ActiveRecord::Base.prepend(ActiveRecordBaseTransactionMetrics)
 | ||
|     end
 | ||
| 
 | ||
|     # observe_transaction_duration is called from ActiveRecordBaseTransactionMetrics.transaction and used to
 | ||
|     # record transaction durations.
 | ||
|     def self.observe_transaction_duration(duration_seconds)
 | ||
|       if current_transaction = ::Gitlab::Metrics::Transaction.current
 | ||
|         current_transaction.observe(:gitlab_database_transaction_seconds, duration_seconds) do
 | ||
|           docstring "Time spent in database transactions, in seconds"
 | ||
|         end
 | ||
|       end
 | ||
|     rescue Prometheus::Client::LabelSetValidator::LabelSetError => err
 | ||
|       # Ensure that errors in recording these metrics don't affect the operation of the application
 | ||
|       Rails.logger.error("Unable to observe database transaction duration: #{err}") # rubocop:disable Gitlab/RailsLogger
 | ||
|     end
 | ||
| 
 | ||
|     # MonkeyPatch for ActiveRecord::Base for adding observability
 | ||
|     module ActiveRecordBaseTransactionMetrics
 | ||
|       # A monkeypatch over ActiveRecord::Base.transaction.
 | ||
|       # It provides observability into transactional methods.
 | ||
|       def transaction(options = {}, &block)
 | ||
|         start_time = Gitlab::Metrics::System.monotonic_time
 | ||
|         super(options, &block)
 | ||
|       ensure
 | ||
|         Gitlab::Database.observe_transaction_duration(Gitlab::Metrics::System.monotonic_time - start_time)
 | ||
|       end
 | ||
|     end
 | ||
|   end
 | ||
| end
 | ||
| 
 | ||
| Gitlab::Database.prepend_if_ee('EE::Gitlab::Database')
 |