# Database Use Cases

## Test 1: Calculate Allele Frequency

In [None]:
-- Allele frequency per variant in p7_staging.two_row_varid.
-- allele_total: a single row holding twice the number of distinct subjects
-- (presumably two alleles per subject -- confirm this holds for the data set).
WITH allele_total AS (
    SELECT COUNT(DISTINCT subject_id) * 2 AS n_total
    FROM p7_staging.two_row_varid
),
-- variant_counts: number of rows carrying each var_id
variant_counts AS (
    SELECT
        var_id,
        COUNT(var_id) AS var_count
    FROM p7_staging.two_row_varid
    GROUP BY var_id
)
-- Divide each variant's count by the allele total. allele_total always has
-- exactly one row, so the explicit CROSS JOIN only attaches n_total to every
-- variant row.
-- NOTE(review): both operands are integers; on engines where integer division
-- truncates, freq would come out as 0 -- cast one operand to a floating type
-- if this is ever run on such an engine.
SELECT
    variant_counts.var_id,
    variant_counts.var_count,
    variant_counts.var_count / allele_total.n_total AS freq
FROM variant_counts
CROSS JOIN allele_total;

Results: 10 rows in 2 seconds

## Test 2: Extract all variants in Exon 5 of BRCA1 transcript.

In [None]:
-- View over p7_product.dbnsfp_vars restricted to rows whose gene_name
-- contains 'BRCA1' on chromosome 17 within pos_block 41.
CREATE VIEW p7_product.brca1 AS
SELECT *
FROM p7_product.dbnsfp_vars
WHERE pos_block = 41
  AND chrom = '17'
  AND gene_name LIKE '%BRCA1%';

Results: 0.04 seconds

### Find all Illumina Variants in BRCA1 exon 5

In [None]:
-- Illumina variants that match a BRCA1 exon 5 annotation row.
-- A variant matches when chromosome, position, reference allele and
-- alternate allele are all equal; the result is the subject id plus every
-- column of the p7_product.brca1 annotation view.
SELECT
    ill.subject_id,
    b.*
FROM p7_platform.wgs_illumina_variant AS ill
INNER JOIN p7_product.brca1 AS b
    ON  ill.chrom = b.chrom
    AND ill.pos = b.pos
    AND ill.ref = b.ref
    AND ill.alt = b.alt
-- The chromosome filter is stated on both sides of the join on purpose:
-- it is logically implied by the join condition, but keeping it explicit
-- preserves the original predicates on each table.
WHERE ill.chrom = '17'
  AND b.chrom = '17'
  AND b.exon_number = 5;

Results:  4.72s  
View Creation + Query = 4.76 seconds  
Expected = 60 seconds  
Time under expected = 55.24 seconds  

## Test 3: Extract all PPC variants in BRCA2 with HGMD and ClinVar annotations

In [None]:
-- Table of BRCA2 annotation rows (gene_name contains 'BRCA2', chromosome 13,
-- pos_block 32) whose ppc value is 'nonsynonymous' or
-- 'frameshift_nonsynonymous'.
-- The two ppc values are tested with IN so they form a single condition:
-- written as "... AND ppc = 'a' OR ppc = 'b'", AND binds tighter than OR and
-- every 'frameshift_nonsynonymous' row would be kept regardless of gene,
-- chromosome or pos_block.
CREATE TABLE p7_product.ppc_brca2 AS
SELECT *
FROM p7_product.dbnsfp_vars
WHERE gene_name LIKE '%BRCA2%'
  AND chrom = '13'
  AND pos_block = 32
  AND ppc IN ('nonsynonymous', 'frameshift_nonsynonymous');

-- Illumina variants on chromosome 13 that match a row of
-- p7_product.ppc_brca2 on chromosome, position, reference allele and
-- alternate allele. Returns the subject id plus every column of the matching
-- ppc_brca2 row.
-- NOTE(review): no ClinVar/HGMD predicate is applied here; any such
-- annotations are only returned as columns of b.* -- confirm that is intended.
SELECT
    ill.subject_id,
    b.*
FROM p7_platform.wgs_illumina_variant AS ill
INNER JOIN p7_product.ppc_brca2 AS b
    ON  ill.chrom = b.chrom
    AND ill.pos = b.pos
    AND ill.ref = b.ref
    AND ill.alt = b.alt
WHERE ill.chrom = '13';


In [None]:
Results: 

## Test 4: Find all variants in BRCA2 that are in ClinVar or HGMD.

In [70]:
-- Materialize the p7_product.dbnsfp_vars rows whose gene_name contains
-- 'BRCA2' on chromosome 13 within pos_block 32.
CREATE TABLE p7_product.brca2 AS
SELECT *
FROM p7_product.dbnsfp_vars
WHERE pos_block = 32
  AND chrom = '13'
  AND gene_name LIKE '%BRCA2%';

Results: 0.04 seconds

-- Illumina variants on chromosome 13 that match a p7_product.brca2 row on
-- chromosome, position, reference allele and alternate allele, keeping only
-- annotation rows whose clin_sig is '4' or '5'.
-- NOTE(review): '4' and '5' are presumably the ClinVar "likely pathogenic" /
-- "pathogenic" codes -- confirm against the annotation source. No HGMD
-- column is filtered here.
SELECT
    ill.subject_id,
    b.*
FROM p7_platform.wgs_illumina_variant AS ill
INNER JOIN p7_product.brca2 AS b
    ON  ill.chrom = b.chrom
    AND ill.pos = b.pos
    AND ill.ref = b.ref
    AND ill.alt = b.alt
WHERE ill.chrom = '13'
  AND b.clin_sig IN ('4', '5');



In [None]:
Results: 3.8 seconds