summaryrefslogtreecommitdiff
path: root/lib/gitlab/database/reindexing/index_selection.rb
blob: 2d384f2f9e23e0452cdb6300e26c1c183a48f5cd (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
# frozen_string_literal: true

module Gitlab
  module Database
    module Reindexing
      # Enumerable selection of the indexes (out of the given candidates) that
      # should be reindexed, ordered from highest to lowest relative bloat level.
      class IndexSelection
        include Enumerable

        # An index is only selected when its relative bloat level
        # (bloat estimate / size) is at least this value
        MINIMUM_RELATIVE_BLOAT = 0.2

        # Indexes with an on-disk size (before reindexing) below this are ignored
        INDEX_SIZE_MINIMUM = 1.gigabyte

        # Enumerable is driven by the memoized selection below
        delegate :each, to: :indexes

        # candidates - relation of indexes to choose from; it must respond to
        #              `not_recently_reindexed` and `where`
        def initialize(candidates)
          @candidates = candidates
        end

        private

        attr_reader :candidates

        # Builds (once) the list of selected indexes.
        #
        # Note the deliberate N+1 query pattern: although bloat estimates
        # for all indexes are generally available through a view, estimating
        # bloat for every index at once is an expensive operation. Asking each
        # candidate for its relative bloat level individually restricts the
        # estimation to the indexes that passed the cheap filters first.
        def indexes
          @indexes ||= begin
            large_enough = candidates
              .not_recently_reindexed
              .where('ondisk_size_bytes >= ?', INDEX_SIZE_MINIMUM)

            # forced N+1: one bloat estimate per remaining candidate
            most_bloated_first = large_enough.sort_by { |index| index.relative_bloat_level }.reverse

            most_bloated_first.select { |index| index.relative_bloat_level >= MINIMUM_RELATIVE_BLOAT }
          end
        end
      end
    end
  end
end