diff options
author | Sean McGivern <sean@gitlab.com> | 2018-07-03 13:23:17 +0100 |
---|---|---|
committer | Oswaldo Ferreira <oswaldo@gitlab.com> | 2018-07-10 09:43:57 -0300 |
commit | 3acf7ba9caf19b1a02b34071454a631c959b5c58 (patch) | |
tree | 7b77ee8a8367b5da887790d833e34fa1693962a3 /db/post_migrate | |
parent | 3d4873fa64c833c71ab7ee274002d854eb93ef96 (diff) | |
download | gitlab-ce-3acf7ba9caf19b1a02b34071454a631c959b5c58.tar.gz |
Revert "Temporarily remove MR diffs removal migration"
This reverts commit 15ec6a13eb4d839d252315bf5b0a50d28351cb5f.
Diffstat (limited to 'db/post_migrate')
-rw-r--r-- | db/post_migrate/20180619121030_enqueue_delete_diff_files_workers.rb | 70 |
1 files changed, 70 insertions, 0 deletions
diff --git a/db/post_migrate/20180619121030_enqueue_delete_diff_files_workers.rb b/db/post_migrate/20180619121030_enqueue_delete_diff_files_workers.rb new file mode 100644 index 00000000000..5fb3d545624 --- /dev/null +++ b/db/post_migrate/20180619121030_enqueue_delete_diff_files_workers.rb @@ -0,0 +1,70 @@ +class EnqueueDeleteDiffFilesWorkers < ActiveRecord::Migration + include Gitlab::Database::MigrationHelpers + + class MergeRequestDiff < ActiveRecord::Base + self.table_name = 'merge_request_diffs' + + belongs_to :merge_request + + include EachBatch + end + + DOWNTIME = false + BATCH_SIZE = 1000 + MIGRATION = 'DeleteDiffFiles' + DELAY_INTERVAL = 8.minutes + TMP_INDEX = 'tmp_partial_diff_id_with_files_index'.freeze + + disable_ddl_transaction! + + def up + # We add temporary index, to make iteration over batches more performant. + # Conditional here is to avoid the need of doing that in a separate + # migration file to make this operation idempotent. + # + unless index_exists_by_name?(:merge_request_diffs, TMP_INDEX) + add_concurrent_index(:merge_request_diffs, :id, where: "(state NOT IN ('without_files', 'empty'))", name: TMP_INDEX) + end + + + diffs_with_files = MergeRequestDiff.where.not(state: ['without_files', 'empty']) + + # explain (analyze, buffers) example for the iteration: + # + # Index Only Scan using tmp_index_20013 on merge_request_diffs (cost=0.43..1630.19 rows=60567 width=4) (actual time=0.047..9.572 rows=56976 loops=1) + # Index Cond: ((id >= 764586) AND (id < 835298)) + # Heap Fetches: 8 + # Buffers: shared hit=18188 + # Planning time: 0.752 ms + # Execution time: 12.430 ms + # + diffs_with_files.each_batch(of: BATCH_SIZE) do |relation, outer_index| + ids = relation.pluck(:id) + + ids.each_with_index do |diff_id, inner_index| + # This will give some space between batches of workers. + interval = DELAY_INTERVAL * outer_index + inner_index.minutes + + # A single `merge_request_diff` can be associated with way too many + # `merge_request_diff_files`. It's better to avoid batching these and + # schedule one at a time. + # + # Considering roughly 6M jobs, this should take ~30 days to process all + # of them. + # + BackgroundMigrationWorker.perform_in(interval, MIGRATION, [diff_id]) + end + end + + # We remove temporary index, because it is not required during standard + # operations and runtime. + # + remove_concurrent_index_by_name(:merge_request_diffs, TMP_INDEX) + end + + def down + if index_exists_by_name?(:merge_request_diffs, TMP_INDEX) + remove_concurrent_index_by_name(:merge_request_diffs, TMP_INDEX) + end + end +end |