Skip to content

Commit 12f666c

Browse files
authored
Merge pull request #2212 from broadinstitute/jb-pairwise-de-api
API integration for user-submitted differential expression calculations (SCP-5767)
2 parents 22c1ead + a27746c commit 12f666c

11 files changed

+454
-85
lines changed

app/controllers/api/v1/site_controller.rb

+151-2
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,8 @@ module Api
22
module V1
33
class SiteController < ApiBaseController
44
before_action :set_current_api_user!
5-
before_action :authenticate_api_user!, only: [:download_data, :stream_data, :get_study_analysis_config,
6-
:submit_study_analysis, :get_study_submissions,
5+
before_action :authenticate_api_user!, only: [:download_data, :stream_data, :submit_differential_expression,
6+
:get_study_analysis_config, :submit_study_analysis, :get_study_submissions,
77
:get_study_submission, :sync_submission_outputs]
88
before_action :set_study, except: [:studies, :check_terra_tos_acceptance, :analyses, :get_analysis, :renew_user_access_token]
99
before_action :set_analysis_configuration, only: [:get_analysis, :get_study_analysis_config]
@@ -403,6 +403,151 @@ def stream_data
403403
end
404404
end
405405

406+
swagger_path '/site/studies/{accession}/differential_expression' do
407+
operation :post do
408+
key :tags, [
409+
'Site'
410+
]
411+
key :summary, 'Submit a differential expression calculation request'
412+
key :description, 'Request differential expression calculations for a given cluster/annotation in a study'
413+
key :operationId, 'site_study_submit_differential_expression_path'
414+
parameter do
415+
key :name, :accession
416+
key :in, :path
417+
key :description, 'Accession of Study to use'
418+
key :required, true
419+
key :type, :string
420+
end
421+
parameter do
422+
key :name, :de_job
423+
key :type, :object
424+
key :in, :body
425+
schema do
426+
property :cluster_name do
427+
key :description, 'Name of cluster group. Use "_default" to use the default cluster'
428+
key :required, true
429+
key :type, :string
430+
end
431+
property :annotation_name do
432+
key :description, 'Name of annotation'
433+
key :required, true
434+
key :type, :string
435+
end
436+
property :annotation_scope do
437+
key :description, 'Scope of annotation. One of "study" or "cluster".'
438+
key :type, :string
439+
key :required, true
440+
key :enum, Api::V1::Visualization::AnnotationsController::VALID_SCOPE_VALUES
441+
end
442+
property :de_type do
443+
key :description, 'Type of differential expression analysis. Either "rest" (one-vs-rest) or "pairwise"'
444+
key :type, :string
445+
key :required, true
446+
key :enum, %w[rest pairwise]
447+
end
448+
property :group1 do
449+
key :description, 'First group for pairwise analysis (optional)'
450+
key :type, :string
451+
end
452+
property :group2 do
453+
key :description, 'Second group for pairwise analysis (optional)'
454+
key :type, :string
455+
end
456+
end
457+
end
458+
response 204 do
459+
key :description, 'Job successfully submitted'
460+
end
461+
response 401 do
462+
key :description, ApiBaseController.unauthorized
463+
end
464+
response 403 do
465+
key :description, ApiBaseController.forbidden('view study, study has author DE')
466+
end
467+
response 404 do
468+
key :description, ApiBaseController.not_found(Study, 'Cluster', 'Annotation')
469+
end
470+
response 406 do
471+
key :description, ApiBaseController.not_acceptable
472+
end
473+
response 409 do
474+
key :description, "Results are processing or already exist"
475+
end
476+
response 410 do
477+
key :description, ApiBaseController.resource_gone
478+
end
479+
response 422 do
480+
key :description, "Job parameters failed validation"
481+
end
482+
response 429 do
483+
key :description, 'Weekly user quota exceeded'
484+
end
485+
end
486+
end
487+
488+
def submit_differential_expression
489+
# disallow DE calculation requests for studies with author DE
490+
if @study.differential_expression_results.where(is_author_de: true).any?
491+
render json: {
492+
error: 'User requests are disabled for this study as it contains author-supplied differential expression results'
493+
}, status: 403 and return
494+
end
495+
496+
# check user quota before proceeding
497+
if DifferentialExpressionService.job_exceeds_quota?(current_api_user)
498+
# minimal log props to help gauge overall user interest, as well as annotation/de types
499+
log_props = {
500+
studyAccession: @study.accession, annotationName: params[:annotation_name], de_type: params[:de_type]
501+
}
502+
MetricsService.log('quota-exceeded-de', log_props, current_api_user, request:)
503+
current_quota = DifferentialExpressionService.get_weekly_user_quota
504+
render json: { error: "You have exceeded your weekly quota of #{current_quota} requests" },
505+
status: 429 and return
506+
end
507+
508+
cluster_name = params[:cluster_name]
509+
cluster = cluster_name == '_default' ? @study.default_cluster : @study.cluster_groups.by_name(cluster_name)
510+
render json: { error: "Requested cluster #{cluster_name} not found" }, status: 404 and return if cluster.nil?
511+
512+
annotation_name = params[:annotation_name]
513+
annotation_scope = params[:annotation_scope]
514+
de_type = params[:de_type]
515+
pairwise = de_type == 'pairwise'
516+
group1 = params[:group1]
517+
group2 = params[:group2]
518+
annotation = AnnotationVizService.get_selected_annotation(
519+
@study, cluster:, annot_name: annotation_name, annot_type: 'group', annot_scope: annotation_scope
520+
)
521+
render json: { error: 'No matching annotation found' }, status: 404 and return if annotation.nil?
522+
523+
de_params = { annotation_name:, annotation_scope:, de_type:, group1:, group2: }
524+
525+
# check if these results already exist
526+
# for pairwise, also check if requested comparisons exist
527+
result = DifferentialExpressionResult.find_by(
528+
study: @study, cluster_group: cluster, annotation_name:, annotation_scope:, is_author_de: false
529+
)
530+
if result && (!pairwise || (pairwise && result.has_pairwise_comparison?(group1, group2)))
531+
render json: { error: "Requested results already exist" }, status: 409 and return
532+
end
533+
534+
begin
535+
submitted = DifferentialExpressionService.run_differential_expression_job(
536+
cluster, @study, current_api_user, **de_params
537+
)
538+
if submitted
539+
DifferentialExpressionService.increment_user_quota(current_api_user)
540+
head 204
541+
else
542+
# submitted: false here means that there is a matching running DE job
543+
render json: { error: "Requested results are processing - please check back later" }, status: 409
544+
end
545+
rescue ArgumentError => e
546+
# job parameters failed to validate
547+
render json: { error: e.message}, status: 422 and return
548+
end
549+
end
550+
406551
swagger_path '/site/analyses' do
407552
operation :get do
408553
key :tags, [
@@ -1136,6 +1281,10 @@ def get_download_quota
11361281
end
11371282
end
11381283

1284+
def de_job_params
1285+
params.require(:de_job).permit(:cluster_name, :annotation_name, :annotation_scope, :de_type, :group1, :group2)
1286+
end
1287+
11391288
# update AnalysisSubmissions when loading study analysis tab
11401289
# will not backfill existing workflows to keep our submission history clean
11411290
def update_analysis_submission(submission)

app/lib/differential_expression_service.rb

+61-20
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,8 @@ class DifferentialExpressionService
99
ALLOWED_ANNOTS = Regexp.union(CELL_TYPE_MATCHER, CLUSTERING_MATCHER)
1010
# specific annotations to exclude from automation
1111
EXCLUDED_ANNOTS = /(enrichment__cell_type)/i
12+
# default quota for user-requested DE jobs
13+
DEFAULT_USER_QUOTA = 5
1214

1315
# run a differential expression job for a given study on the default cluster/annotation
1416
#
@@ -163,25 +165,27 @@ def self.run_differential_expression_job(cluster_group, study, user, annotation_
163165
params_object.machine_type = machine_type if machine_type.present? # override :machine_type if specified
164166
return true if dry_run # exit before submission if specified as annotation was already validated
165167

166-
# check if there's already a job running using these parameters and exit if so
167-
job_params = ApplicationController.batch_api_client.format_command_line(
168-
study_file:, action: :differential_expression, user_metrics_uuid: user.metrics_uuid, params_object:
169-
)
170-
running = ApplicationController.batch_api_client.find_matching_jobs(
171-
params: job_params, job_states: BatchApiClient::RUNNING_STATES
172-
)
173-
if running.any?
174-
log_message "Found #{running.count} running DE jobs: #{running.map(&:name).join(', ')}"
175-
log_message "Matching these parameters: #{job_params.join(' ')}"
176-
log_message "Exiting without queuing new job"
177-
false
178-
elsif params_object.valid?
179-
# launch DE job
180-
job = IngestJob.new(study:, study_file:, user:, action: :differential_expression, params_object:)
181-
job.delay.push_remote_and_launch_ingest
182-
true
168+
if params_object.valid?
169+
# check if there's already a job running using these parameters and exit if so
170+
job_params = ApplicationController.batch_api_client.format_command_line(
171+
study_file:, action: :differential_expression, user_metrics_uuid: user.metrics_uuid, params_object:
172+
)
173+
running = ApplicationController.batch_api_client.find_matching_jobs(
174+
params: job_params, job_states: BatchApiClient::RUNNING_STATES
175+
)
176+
if running.any?
177+
log_message "Found #{running.count} running DE jobs: #{running.map(&:name).join(', ')}"
178+
log_message "Matching these parameters: #{job_params.join(' ')}"
179+
log_message "Exiting without queuing new job"
180+
false
181+
else
182+
# launch DE job
183+
job = IngestJob.new(study:, study_file:, user:, action: :differential_expression, params_object:)
184+
job.delay.push_remote_and_launch_ingest
185+
true
186+
end
183187
else
184-
raise ArgumentError, "job parameters failed to validate: #{params_object.errors.full_messages}"
188+
raise ArgumentError, "job parameters failed to validate: #{params_object.errors.full_messages.join(', ')}"
185189
end
186190
end
187191

@@ -377,12 +381,14 @@ def self.validate_annotation(cluster_group, study, annotation_name, annotation_s
377381
if !pairwise && cells_by_label.keys.count < 2
378382
raise ArgumentError, "#{identifier} does not have enough labels represented in #{cluster_group.name}"
379383
elsif pairwise
380-
missing = {
384+
missing = [group1, group2] - annotation[:values]
385+
raise ArgumentError, "#{annotation_name} does not contain '#{missing.join(', ')}'" if missing.any?
386+
cell_count = {
381387
"#{group1}" => cells_by_label[group1].count,
382388
"#{group2}" => cells_by_label[group2].count
383389
}.keep_if { |_, c| c < 2 }
384390
raise ArgumentError,
385-
"#{missing.keys.join(', ')} does not have enough cells represented in #{identifier}" if missing.any?
391+
"#{cell_count.keys.join(', ')} does not have enough cells represented in #{identifier}" if cell_count.any?
386392
end
387393
end
388394

@@ -451,4 +457,39 @@ def self.cluster_file_url(cluster_group)
451457
study_file.gs_url
452458
end
453459
end
460+
461+
# retrieve the weekly user quota value
462+
#
463+
# * *returns*
464+
# - (Integer)
465+
def self.get_weekly_user_quota
466+
config = AdminConfiguration.find_by(config_type: 'Weekly User DE Quota')
467+
config ? config.value.to_i : DEFAULT_USER_QUOTA
468+
end
469+
470+
# check if a user has exceeded their weekly quota
471+
#
472+
# * *params*
473+
# - +user+ (User) => user requesting DE job
474+
#
475+
# * *returns*
476+
# - (Boolean)
477+
def self.job_exceeds_quota?(user)
478+
user.weekly_de_quota.to_i >= get_weekly_user_quota
479+
end
480+
481+
# increment a given user's weekly quota
482+
#
483+
# * *params*
484+
# - +user+ (User) => user requesting DE job
485+
def self.increment_user_quota(user)
486+
current_quota = user.weekly_de_quota.to_i
487+
current_quota += 1
488+
user.update(weekly_de_quota: current_quota)
489+
end
490+
491+
# reset all user-requested DE quotas on a weekly basis
492+
def self.reset_all_user_quotas
493+
User.update_all(weekly_de_quota: 0)
494+
end
454495
end

app/models/admin_configuration.rb

+3-2
Original file line numberDiff line numberDiff line change
@@ -20,8 +20,9 @@ class AdminConfiguration
2020
API_NOTIFIER_NAME = 'API Health Check Notifier'.freeze
2121
INGEST_DOCKER_NAME = 'Ingest Pipeline Docker Image'.freeze
2222
NUMERIC_VALS = %w[byte kilobyte megabyte terabyte petabyte exabyte].freeze
23-
CONFIG_TYPES = [INGEST_DOCKER_NAME, 'Daily User Download Quota', 'Portal FireCloud User Group', 'TDR Snapshot IDs',
24-
'Reference Data Workspace', 'Read-Only Access Control', 'QA Dev Email', API_NOTIFIER_NAME].freeze
23+
CONFIG_TYPES = [INGEST_DOCKER_NAME, 'Daily User Download Quota', 'Weekly User DE Quota', 'Portal FireCloud User Group',
24+
'TDR Snapshot IDs', 'Reference Data Workspace', 'Read-Only Access Control', 'QA Dev Email',
25+
API_NOTIFIER_NAME].freeze
2526
ALL_CONFIG_TYPES = (CONFIG_TYPES.dup << FIRECLOUD_ACCESS_NAME).freeze
2627
VALUE_TYPES = %w[Numeric Boolean String].freeze
2728

app/models/ingest_job.rb

+5-1
Original file line numberDiff line numberDiff line change
@@ -1011,9 +1011,13 @@ def get_job_analytics
10111011
job_props.merge!(
10121012
{
10131013
numCells: cluster&.points,
1014-
numAnnotationValues: annotation[:values]&.size
1014+
numAnnotationValues: annotation[:values]&.size,
1015+
deType: params_object.de_type
10151016
}
10161017
)
1018+
if params_object.de_type == 'pairwise'
1019+
job_props.merge!( { pairwiseGroups: [params_object.group1, params_object.group2]})
1020+
end
10171021
when :image_pipeline
10181022
data_cache_perftime = params_object.data_cache_perftime
10191023
job_props.merge!(

app/models/user.rb

+1
Original file line numberDiff line numberDiff line change
@@ -87,6 +87,7 @@ def owned_by(user)
8787
field :admin, type: Boolean
8888
field :reporter, type: Boolean
8989
field :daily_download_quota, type: Integer, default: 0
90+
field :weekly_de_quota, type: Integer, default: 0 # limits number of user-requested DE jobs
9091
field :admin_email_delivery, type: Boolean, default: true
9192
field :registered_for_firecloud, type: Boolean, default: false
9293
# {

config/routes.rb

+1
Original file line numberDiff line numberDiff line change
@@ -87,6 +87,7 @@
8787
get 'studies/:accession', to: 'site#view_study', as: :site_study_view
8888
get 'studies/:accession/download', to: 'site#download_data', as: :site_study_download_data
8989
get 'studies/:accession/stream', to: 'site#stream_data', as: :site_study_stream_data
90+
post 'studies/:accession/differential_expression', to: 'site#submit_differential_expression', as: :site_study_submit_differential_expression
9091
get 'studies/:accession/renew_read_only_access_token', to: 'site#renew_read_only_access_token', as: :site_renew_read_only_access_token
9192
get 'renew_user_access_token', to: 'site#renew_user_access_token', as: :site_renew_user_access_token
9293

rails_startup.bash

+1
Original file line numberDiff line numberDiff line change
@@ -127,6 +127,7 @@ fi
127127

128128
echo "*** ADDING DAILY RESET OF USER DOWNLOAD QUOTAS ***"
129129
(crontab -u app -l ; echo "@daily . /home/app/.cron_env ; cd /home/app/webapp/; /home/app/webapp/bin/rails runner -e $PASSENGER_APP_ENV \"DownloadQuotaService.reset_all_quotas\" >> /home/app/webapp/log/cron_out.log 2>&1") | crontab -u app -
130+
(crontab -u app -l ; echo "@weekly . /home/app/.cron_env ; cd /home/app/webapp/; /home/app/webapp/bin/rails runner -e $PASSENGER_APP_ENV \"DifferentialExpressionService.reset_all_user_quotas\" >> /home/app/webapp/log/cron_out.log 2>&1") | crontab -u app -
130131
echo "*** COMPLETED ***"
131132

132133
echo "*** LOCALIZING USER ASSETS ***"

0 commit comments

Comments
 (0)