Skip to content

Commit

Permalink
no need for a gcloud install at runtime
Browse files (browse the repository at this point in the history)
  • Loading branch information
MattWellie committed May 24, 2024
1 parent ce03f06 commit 4394227
Showing 1 changed file with 4 additions and 2 deletions.
6 changes: 4 additions & 2 deletions cpg_workflows/jobs/gcnv.py
Original file line number Diff line number Diff line change
Expand Up @@ -322,9 +322,11 @@ def postprocess_calls(
  model_shard_args = ''
  calls_shard_args = ''

- # forced ordering here just in case
+ # import with hail batch instead, then unpack in the container. No need to depend on a gcloud/gsutil install
+ # https://batch.hail.populationgenomics.org.au/batches/454143/jobs/1
  for name, path in [(shard, shard_paths[shard]) for shard in shard_basenames()]:
- gcp_related_commands.append(f'gsutil cat {path} | tar -xz -C $BATCH_TMPDIR/inputs')
+ shard_tar = get_batch().read_input(str(path))
+ gcp_related_commands.append(f'tar -xzf {shard_tar} -C $BATCH_TMPDIR/inputs')
  model_shard_args += f' --model-shard-path $BATCH_TMPDIR/inputs/{name}-model'
  calls_shard_args += f' --calls-shard-path $BATCH_TMPDIR/inputs/{name}-calls'

Expand Down

0 comments on commit 4394227

Please sign in to comment.