Skip to content

Commit

Permalink
Merge branch 'fix/gh-import-status-check' into 'master'
Browse files Browse the repository at this point in the history
Periodically mark projects that are stuck in importing as failed

Closes #17709

See merge request !10207
  • Loading branch information
smcgivern committed Apr 6, 2017
2 parents dc20dd1 + 94716c2 commit 6185429
Show file tree
Hide file tree
Showing 13 changed files with 129 additions and 5 deletions.
4 changes: 3 additions & 1 deletion app/workers/repository_import_worker.rb
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,8 @@ class RepositoryImportWorker
include Sidekiq::Worker
include DedicatedSidekiqQueue

sidekiq_options status_expiration: StuckImportJobsWorker::IMPORT_EXPIRATION

attr_accessor :project, :current_user

def perform(project_id)
Expand All @@ -12,7 +14,7 @@ def perform(project_id)
import_url: @project.import_url,
path: @project.path_with_namespace)

project.update_column(:import_error, nil)
project.update_columns(import_jid: self.jid, import_error: nil)

result = Projects::ImportService.new(project, current_user).execute

Expand Down
37 changes: 37 additions & 0 deletions app/workers/stuck_import_jobs_worker.rb
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
class StuckImportJobsWorker
include Sidekiq::Worker
include CronjobQueue

IMPORT_EXPIRATION = 15.hours.to_i

def perform
stuck_projects.find_in_batches(batch_size: 500) do |group|
jids = group.map(&:import_jid)

# Find the jobs that aren't currently running or that exceeded the threshold.
completed_jids = Gitlab::SidekiqStatus.completed_jids(jids)

if completed_jids.any?
completed_ids = group.select { |project| completed_jids.include?(project.import_jid) }.map(&:id)

fail_batch!(completed_jids, completed_ids)
end
end
end

private

def stuck_projects
Project.select('id, import_jid').with_import_status(:started).where.not(import_jid: nil)
end

def fail_batch!(completed_jids, completed_ids)
Project.where(id: completed_ids).update_all(import_status: 'failed', import_error: error_message)

Rails.logger.info("Marked stuck import jobs as failed. JIDs: #{completed_jids.join(', ')}")
end

def error_message
"Import timed out. Import took longer than #{IMPORT_EXPIRATION} seconds"
end
end
4 changes: 4 additions & 0 deletions changelogs/unreleased/fix-gh-import-status-check.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
---
title: Periodically mark projects that are stuck in importing as failed
merge_request:
author:
3 changes: 3 additions & 0 deletions config/initializers/1_settings.rb
Original file line number Diff line number Diff line change
Expand Up @@ -349,6 +349,9 @@ def host(url)
Settings.cron_jobs['remove_unreferenced_lfs_objects_worker'] ||= Settingslogic.new({})
Settings.cron_jobs['remove_unreferenced_lfs_objects_worker']['cron'] ||= '20 0 * * *'
Settings.cron_jobs['remove_unreferenced_lfs_objects_worker']['job_class'] = 'RemoveUnreferencedLfsObjectsWorker'
Settings.cron_jobs['stuck_import_jobs_worker'] ||= Settingslogic.new({})
Settings.cron_jobs['stuck_import_jobs_worker']['cron'] ||= '15 * * * *'
Settings.cron_jobs['stuck_import_jobs_worker']['job_class'] = 'StuckImportJobsWorker'

#
# GitLab Shell
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,9 @@ class AddIndexToProjectAuthorizations < ActiveRecord::Migration
disable_ddl_transaction!

def up
add_concurrent_index(:project_authorizations, :project_id)
unless index_exists?(:project_authorizations, :project_id)
add_concurrent_index(:project_authorizations, :project_id)
end
end

def down
Expand Down
9 changes: 9 additions & 0 deletions db/migrate/20170405080720_add_import_jid_to_projects.rb
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
class AddImportJidToProjects < ActiveRecord::Migration
include Gitlab::Database::MigrationHelpers

DOWNTIME = false

def change
add_column :projects, :import_jid, :string
end
end
3 changes: 2 additions & 1 deletion db/schema.rb
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@
#
# It's strongly recommended that you check this file into your version control system.

ActiveRecord::Schema.define(version: 20170402231018) do
ActiveRecord::Schema.define(version: 20170405080720) do

# These are extensions that must be enabled in order to support this database
enable_extension "plpgsql"
Expand Down Expand Up @@ -920,6 +920,7 @@
t.text "description_html"
t.boolean "only_allow_merge_if_all_discussions_are_resolved"
t.boolean "printing_merge_request_link_enabled", default: true, null: false
t.string "import_jid"
end

add_index "projects", ["ci_id"], name: "index_projects_on_ci_id", using: :btree
Expand Down
13 changes: 13 additions & 0 deletions lib/gitlab/sidekiq_status.rb
Original file line number Diff line number Diff line change
Expand Up @@ -72,6 +72,8 @@ def self.num_completed(job_ids)
# job_ids - The Sidekiq job IDs to check.
#
# Returns an array of true or false indicating job completion.
# true = job is still running
# false = job completed
def self.job_status(job_ids)
keys = job_ids.map { |jid| key_for(jid) }

Expand All @@ -82,6 +84,17 @@ def self.job_status(job_ids)
end
end

# Returns the JIDs that are completed
#
# job_ids - The Sidekiq job IDs to check.
#
# Returns an array of completed JIDs
def self.completed_jids(job_ids)
Sidekiq.redis do |redis|
job_ids.reject { |jid| redis.exists(key_for(jid)) }
end
end

def self.key_for(jid)
STATUS_KEY % jid
end
Expand Down
4 changes: 3 additions & 1 deletion lib/gitlab/sidekiq_status/client_middleware.rb
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,9 @@ module Gitlab
module SidekiqStatus
class ClientMiddleware
def call(_, job, _, _)
Gitlab::SidekiqStatus.set(job['jid'])
status_expiration = job['status_expiration'] || Gitlab::SidekiqStatus::DEFAULT_EXPIRATION

Gitlab::SidekiqStatus.set(job['jid'], status_expiration)
yield
end
end
Expand Down
2 changes: 1 addition & 1 deletion spec/lib/gitlab/sidekiq_status/client_middleware_spec.rb
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@
describe Gitlab::SidekiqStatus::ClientMiddleware do
describe '#call' do
it 'tracks the job in Redis' do
expect(Gitlab::SidekiqStatus).to receive(:set).with('123')
expect(Gitlab::SidekiqStatus).to receive(:set).with('123', Gitlab::SidekiqStatus::DEFAULT_EXPIRATION)

described_class.new.
call('Foo', { 'jid' => '123' }, double(:queue), double(:pool)) { nil }
Expand Down
13 changes: 13 additions & 0 deletions spec/lib/gitlab/sidekiq_status_spec.rb
Original file line number Diff line number Diff line change
Expand Up @@ -73,4 +73,17 @@
expect(key).to include('123')
end
end

describe 'completed', :redis do
it 'returns the completed job' do
expect(described_class.completed_jids(%w(123))).to eq(['123'])
end

it 'returns only the jobs completed' do
described_class.set('123')
described_class.set('456')

expect(described_class.completed_jids(%w(123 456 789))).to eq(['789'])
end
end
end
2 changes: 2 additions & 0 deletions spec/workers/repository_import_worker_spec.rb
Original file line number Diff line number Diff line change
Expand Up @@ -23,10 +23,12 @@
error = %q{remote: Not Found fatal: repository 'https://user:pass@test.com/root/repoC.git/' not found }
expect_any_instance_of(Projects::ImportService).to receive(:execute).
and_return({ status: :error, message: error })
allow(subject).to receive(:jid).and_return('123')

subject.perform(project.id)

expect(project.reload.import_error).to include("https://*****:*****@test.com/root/repoC.git/")
expect(project.reload.import_jid).not_to be_nil
end
end
end
Expand Down
36 changes: 36 additions & 0 deletions spec/workers/stuck_import_jobs_worker_spec.rb
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
require 'spec_helper'

describe StuckImportJobsWorker do
let(:worker) { described_class.new }
let(:exclusive_lease_uuid) { SecureRandom.uuid }

before do
allow_any_instance_of(Gitlab::ExclusiveLease).to receive(:try_obtain).and_return(exclusive_lease_uuid)
end

describe 'long running import' do
let(:project) { create(:empty_project, import_jid: '123', import_status: 'started') }

before do
allow(Gitlab::SidekiqStatus).to receive(:completed_jids).and_return(['123'])
end

it 'marks the project as failed' do
expect { worker.perform }.to change { project.reload.import_status }.to('failed')
end
end

describe 'running import' do
let(:project) { create(:empty_project, import_jid: '123', import_status: 'started') }

before do
allow(Gitlab::SidekiqStatus).to receive(:completed_jids).and_return([])
end

it 'does not mark the project as failed' do
worker.perform

expect(project.reload.import_status).to eq('started')
end
end
end

0 comments on commit 6185429

Please sign in to comment.