summaryrefslogtreecommitdiff
path: root/app/services/ci/destroy_expired_job_artifacts_service.rb
blob: d91cfb3cc8299ff9c517ca351b3138d60897046d (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
# frozen_string_literal: true

module Ci
  # Service that walks expired `Ci::JobArtifact` records in batches, hands each
  # batch (narrowed by the `unlocked` scope) to
  # `Ci::JobArtifactsDestroyBatchService`, and keeps a running total of how
  # many artifacts that service reports as destroyed.
  class DestroyExpiredJobArtifactsService
    include ::Gitlab::ExclusiveLeaseHelpers
    include ::Gitlab::LoopHelpers

    # Number of records requested per `each_batch` iteration.
    BATCH_SIZE = 100
    # Batch iteration stops once more than this has elapsed since it started.
    LOOP_TIMEOUT = 5.minutes
    # Batch iteration stops once the batch index reaches this value.
    LOOP_LIMIT = 1000
    # Key handed to `in_lock` to identify the exclusive lease.
    EXCLUSIVE_LOCK_KEY = 'expired_job_artifacts:destroy:lock'
    # TTL handed to `in_lock` for the exclusive lease.
    LOCK_TIMEOUT = 6.minutes

    def initialize
      # Running total, incremented after every processed batch.
      @removed_artifacts_count = 0
    end

    ##
    # Destroys expired job artifacts on the GitLab instance.
    #
    # The whole run happens inside `in_lock` with a 6-minute TTL, and the
    # batch loop stops after 5 minutes, so a single run is not expected to
    # last longer than 6 minutes. The `ExpireBuildArtifactsWorker` cron job is
    # scheduled every 7 minutes; this bound is meant to keep two of its runs
    # from working concurrently.
    #
    # NOTE(review): what happens when the lease cannot be obtained is decided
    # by `in_lock` (Gitlab::ExclusiveLeaseHelpers), which is not visible here.
    #
    # Returns the number of destroyed artifacts accumulated during this run.
    def execute
      in_lock(EXCLUSIVE_LOCK_KEY, ttl: LOCK_TIMEOUT, retries: 1) do
        destroy_job_artifacts_with_slow_iteration(Time.current)
      end

      @removed_artifacts_count
    end

    private

    # Iterates over artifacts that expired before `start_at`, batching on
    # `expire_at` in descending order, and destroys each batch in turn.
    #
    # The loop ends early when the time budget is exhausted or when the batch
    # index reaches LOOP_LIMIT; both checks run after the batch is processed.
    def destroy_job_artifacts_with_slow_iteration(start_at)
      expired_scope = Ci::JobArtifact.expired_before(start_at)

      expired_scope.each_batch(of: BATCH_SIZE, column: :expire_at, order: :desc) do |batch, batch_index|
        # The `unlocked` scope is applied only after the batch has been
        # selected: joining with ci_pipelines at this point is done for
        # performance reasons.
        # See: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/47496
        result = destroy_batch_async(batch.unlocked)
        @removed_artifacts_count += result[:destroyed_artifacts_count]

        break if loop_timeout?(start_at) || batch_index >= LOOP_LIMIT
      end
    end

    # Delegates destruction of one batch to the batch service and returns its
    # response, from which the caller reads `:destroyed_artifacts_count`.
    def destroy_batch_async(artifacts)
      Ci::JobArtifactsDestroyBatchService.new(artifacts).execute
    end

    # True once the current time is past `start_at` plus LOOP_TIMEOUT.
    def loop_timeout?(start_at)
      deadline = start_at + LOOP_TIMEOUT

      Time.current > deadline
    end
  end
end