In [None]:
import os
import numpy as np
import pandas as pd
import pandas_profiling
import plotnine
from plotnine import *  # Provides a ggplot-like interface to matplotlib.
from IPython.display import display

In [None]:
%%bash --out R2_JOB_ID2
# Submit one "prs_accuracy" job per (phenotype, population) pair, scoring the
# <ukb_pheno>_PRS_CS_<pop>.sscore profiles with cal_accuracy_binary.R.
#
# Input : phenos/pheno_list_binary.txt (relative to the cell's working
#         directory), tab-separated: <ukb_pheno> <aou_pheno>.
# Output: whatever the submissions print on stdout is stored by the cell magic
#         in the notebook variable R2_JOB_ID2; warnings go to stderr so they do
#         not end up in that variable.
source ~/aou_dsub.bash

# aou_dsub is expected to come from the sourced file (presumably a dsub
# wrapper -- confirm there). Fail once here instead of once per loop iteration.
if ! command -v aou_dsub >/dev/null; then
  printf 'aou_dsub is not defined after sourcing ~/aou_dsub.bash\n' >&2
  exit 1
fi

# Every bucket path below is derived from WORKSPACE_BUCKET; abort if it is unset.
: "${WORKSPACE_BUCKET:?WORKSPACE_BUCKET must be set}"

pops=(EUR META)

# The same table is passed as phenotype, covariate and PC input.
pheno_table="${WORKSPACE_BUCKET}/panukbb/phenos/0523_panukbb_binary_phenotypes.txt.gz"

# '|| [[ -n ... ]]' keeps the final row when the list has no trailing newline.
while IFS=$'\t' read -r ukb_pheno aou_pheno || [[ -n "${ukb_pheno}" ]]; do
  # Blank or one-column rows would submit jobs with empty names; skip them.
  if [[ -z "${ukb_pheno}" || -z "${aou_pheno}" ]]; then
    printf 'skipping malformed row: [%s] [%s]\n' "${ukb_pheno}" "${aou_pheno}" >&2
    continue
  fi

  for pop in "${pops[@]}"; do
    # Label key corrected from the misspelled "bath" to "batch" so the jobs can
    # be filtered by their batch label.
    aou_dsub \
      --image gcr.io/ukbb-diversepops-neale/yw-prs-r:test \
      --min-cores 4 \
      --min-ram 10 \
      --disk-size 10 \
      --boot-disk-size 10 \
      --name "prs_accuracy" \
      --preemptible \
      --input PRSFILE="${WORKSPACE_BUCKET}/panukbb/profiles/combined/${ukb_pheno}_PRS_CS_${pop}.sscore" \
      --env POPFILE="NULL" --env K="NULL" \
      --input PHENOFILE="${pheno_table}" \
      --env PHENO="${aou_pheno}" \
      --input COVFILE="${pheno_table}" \
      --env COVS="age,sex_at_birth" --env PC_NUMBERS="PC1,PC2,PC3,PC4,PC5,PC6,PC7,PC8,PC9,PC10" \
      --input PCFILE="${pheno_table}" \
      --env COHORT="panUKBB" --env LDREF="1KG" \
      --output OUT="${WORKSPACE_BUCKET}/panukbb/outputs/${ukb_pheno}_PRS_CS_${pop}.txt" \
      --label "batch=prscs_binary_0507" \
      --script 'cal_accuracy_binary.R'
  done
done < phenos/pheno_list_binary.txt

In [None]:
%%bash --out R2_JOB_ID3
# Submit one "prs_accuracy" job per (phenotype, population, S1..S10) triple,
# scoring the <ukb_pheno>_S<seq>_PT_<pop>.sscore profiles with
# cal_accuracy_binary.R.
#
# Input : phenos/pheno_list_binary.txt (relative to the cell's working
#         directory), tab-separated: <ukb_pheno> <aou_pheno>.
# Output: whatever the submissions print on stdout is stored by the cell magic
#         in the notebook variable R2_JOB_ID3; warnings go to stderr so they do
#         not end up in that variable.
source ~/aou_dsub.bash

# aou_dsub is expected to come from the sourced file (presumably a dsub
# wrapper -- confirm there). Fail once here instead of once per loop iteration.
if ! command -v aou_dsub >/dev/null; then
  printf 'aou_dsub is not defined after sourcing ~/aou_dsub.bash\n' >&2
  exit 1
fi

# Every bucket path below is derived from WORKSPACE_BUCKET; abort if it is unset.
: "${WORKSPACE_BUCKET:?WORKSPACE_BUCKET must be set}"

pops=(EUR META)

# The same table is passed as phenotype, covariate and PC input.
pheno_table="${WORKSPACE_BUCKET}/panukbb/phenos/0523_panukbb_binary_phenotypes.txt.gz"

# '|| [[ -n ... ]]' keeps the final row when the list has no trailing newline.
while IFS=$'\t' read -r ukb_pheno aou_pheno || [[ -n "${ukb_pheno}" ]]; do
  # Blank or one-column rows would submit jobs with empty names; skip them.
  if [[ -z "${ukb_pheno}" || -z "${aou_pheno}" ]]; then
    printf 'skipping malformed row: [%s] [%s]\n' "${ukb_pheno}" "${aou_pheno}" >&2
    continue
  fi

  for pop in "${pops[@]}"; do
    for seq in {1..10}; do
      # Label key corrected from the misspelled "bath" to "batch" so the jobs
      # can be filtered by their batch label.
      aou_dsub \
        --image gcr.io/ukbb-diversepops-neale/yw-prs-r:test \
        --min-cores 4 \
        --min-ram 10 \
        --disk-size 10 \
        --boot-disk-size 10 \
        --name "prs_accuracy" \
        --preemptible \
        --input PRSFILE="${WORKSPACE_BUCKET}/panukbb/profiles/combined/${ukb_pheno}_S${seq}_PT_${pop}.sscore" \
        --env POPFILE="NULL" --env K="NULL" \
        --input PHENOFILE="${pheno_table}" \
        --env PHENO="${aou_pheno}" \
        --input COVFILE="${pheno_table}" \
        --env COVS="age,sex_at_birth" --env PC_NUMBERS="PC1,PC2,PC3,PC4,PC5,PC6,PC7,PC8,PC9,PC10" \
        --input PCFILE="${pheno_table}" \
        --env COHORT="panUKBB" --env LDREF="1KG" \
        --output OUT="${WORKSPACE_BUCKET}/panukbb/outputs/${ukb_pheno}_S${seq}_PT_${pop}.txt" \
        --label "batch=pt_binary_0507" \
        --script 'cal_accuracy_binary.R'
    done
  done
done < phenos/pheno_list_binary.txt

In [None]:
%%bash --out R2_JOB_ID
# For every phenotype whose <ukb_pheno>_PRScsx_v2_META.sscore profile exists in
# the workspace bucket, submit a "prs_accuracy" job running
# cal_accuracy_binary.R, unless a local result file is already present.
#
# Input : /home/jupyter/panukbb/phenos/pheno_list_binary.txt, tab-separated:
#         <ukb_pheno> <aou_pheno>.
# Output: stdout (phenotype names, "prsfile not exists" messages and whatever
#         the submissions print) is stored by the cell magic in the notebook
#         variable R2_JOB_ID; malformed-row warnings go to stderr.
source ~/aou_dsub.bash

# aou_dsub is expected to come from the sourced file (presumably a dsub
# wrapper -- confirm there). Fail once here instead of once per loop iteration.
if ! command -v aou_dsub >/dev/null; then
  printf 'aou_dsub is not defined after sourcing ~/aou_dsub.bash\n' >&2
  exit 1
fi

# The PRS, POPFILE and OUT paths are derived from WORKSPACE_BUCKET; abort if unset.
: "${WORKSPACE_BUCKET:?WORKSPACE_BUCKET must be set}"

# NOTE(review): the phenotype table lives in a hard-coded bucket rather than
# under ${WORKSPACE_BUCKET}; confirm that this is intentional.
pheno_table="gs://fc-secure-0a267fcd-4f74-4643-b7f3-d0cf2e548bcc/panukbb/phenos/0523_panukbb_binary_phenotypes.txt.gz"

# '|| [[ -n ... ]]' keeps the final row when the list has no trailing newline.
while IFS=$'\t' read -r ukb_pheno aou_pheno || [[ -n "${ukb_pheno}" ]]; do
  # Blank or one-column rows would produce empty names; skip them.
  if [[ -z "${ukb_pheno}" || -z "${aou_pheno}" ]]; then
    printf 'skipping malformed row: [%s] [%s]\n' "${ukb_pheno}" "${aou_pheno}" >&2
    continue
  fi

  prsfile="${WORKSPACE_BUCKET}/panukbb/profiles/combined/${ukb_pheno}_PRScsx_v2_META.sscore"

  # Quoted so a phenotype name containing spaces or glob characters is passed
  # to gsutil as a single argument.
  if gsutil -q stat "${prsfile}"; then
    echo "${ukb_pheno}"

    # NOTE(review): the skip check looks at a local path, while the job writes
    # OUT to the bucket; this presumably relies on results being copied to
    # /home/jupyter/panukbb/outputs/binary/ beforehand -- confirm.
    outf="/home/jupyter/panukbb/outputs/binary/${ukb_pheno}_PRScsx_v2_META.txt"

    if [[ ! -f "${outf}" ]]; then
      aou_dsub \
        --image gcr.io/ukbb-diversepops-neale/yw-prs-r:test \
        --min-cores 1 \
        --min-ram 10 \
        --disk-size 10 \
        --boot-disk-size 10 \
        --name "prs_accuracy" \
        --input PRSFILE="${prsfile}" \
        --input POPFILE="${WORKSPACE_BUCKET}/panukbb/data/test_ids.list" \
        --env K="NULL" \
        --input PHENOFILE="${pheno_table}" \
        --env PHENO="${aou_pheno}" \
        --input COVFILE="${pheno_table}" \
        --env COVS="age,sex_at_birth" --env PC_NUMBERS="PC1,PC2,PC3,PC4,PC5,PC6,PC7,PC8,PC9,PC10" \
        --input PCFILE="${pheno_table}" \
        --env COHORT="panUKBB_AoU" --env LDREF="1KG" \
        --output OUT="${WORKSPACE_BUCKET}/panukbb/outputs/${ukb_pheno}_PRScsx_v2_META.txt" \
        --label "batch=prscsx_binary_1112" \
        --script '/home/jupyter/panukbb/scripts/cal_accuracy_binary.R'
    fi
  else
    echo "prsfile not exists"
  fi
done < /home/jupyter/panukbb/phenos/pheno_list_binary.txt