summary refs log tree commit diff
path: root/app/workers
diff options
context:
space:
mode:
author Toon Claes <toon@gitlab.com> 2018-05-02 20:05:40 +0200
committer Toon Claes <toon@gitlab.com> 2018-05-07 09:42:09 +0200
commit aafd78c57f8a4429c2670faeb93ebfccfff0bb29 (patch)
tree 1fdf0f9565406413084c61098f48e22fb6ac480b /app/workers
parent 7bd8d2e2f69f4a0ff801aa7d99b86d7bc714c1a0 (diff)
download gitlab-ce-aafd78c57f8a4429c2670faeb93ebfccfff0bb29.tar.gz
Refactor RepositoryCheck::BatchWorker
Split the project ID lookup into separate methods so that they are easier to override.
Diffstat (limited to 'app/workers')
-rw-r--r-- app/workers/repository_check/batch_worker.rb 31
1 files changed, 23 insertions, 8 deletions
diff --git a/app/workers/repository_check/batch_worker.rb b/app/workers/repository_check/batch_worker.rb
index a76ae3abbe7..9aceb512d34 100644
--- a/app/workers/repository_check/batch_worker.rb
+++ b/app/workers/repository_check/batch_worker.rb
@@ -4,6 +4,7 @@ module RepositoryCheck
include CronjobQueue
RUN_TIME = 3600
+ BATCH_SIZE = 10_000
def perform
return unless Gitlab::CurrentSettings.repository_checks_enabled
@@ -15,7 +16,7 @@ module RepositoryCheck
# projects to check. By default sidekiq-cron will start a new
# RepositoryCheckWorker each hour so that as long as there are repositories to
# check, only one (or two) will be checked at a time.
- project_ids.each do |project_id|
+ find_batch.each do |project_id|
break if Time.now - start >= RUN_TIME
next unless try_obtain_lease(project_id)
@@ -31,13 +32,27 @@ module RepositoryCheck
# array of ID's. This is OK because we do it only once an hour, because
# getting ID's from Postgres is not terribly slow, and because no user
# has to sit and wait for this query to finish.
- def project_ids
- limit = 10_000
- never_checked_projects = Project.where('last_repository_check_at IS NULL AND created_at < ?', 24.hours.ago)
- .limit(limit).pluck(:id)
- old_check_projects = Project.where('last_repository_check_at < ?', 1.month.ago)
- .reorder('last_repository_check_at ASC').limit(limit).pluck(:id)
- never_checked_projects + old_check_projects
+ def find_batch(batch_size = BATCH_SIZE)
+ project_ids = never_checked_project_ids(batch_size)
+
+ remaining_capacity = batch_size - project_ids.count
+
+ if remaining_capacity > 0
+ project_ids + old_checked_project_ids(remaining_capacity)
+ else
+ project_ids
+ end
+ end
+
+ def never_checked_project_ids(batch_size)
+ Project.where('last_repository_check_at IS NULL AND created_at < ?', 24.hours.ago)
+ .limit(batch_size).pluck(:id)
+ end
+
+ def old_checked_project_ids(batch_size)
+ Project.where('last_repository_check_at < ?', 1.month.ago)
+ .reorder(last_repository_check_at: :asc)
+ .limit(batch_size).pluck(:id)
end
def try_obtain_lease(id)