In [None]:
import malariagen_data

# Ag3 API handle. The "simplecache::" prefix is fsspec URL chaining: files
# read from the GCS bucket are cached locally under ../gcs_cache.
ag3 = malariagen_data.Ag3(
    "simplecache::gs://vo_agam_release_master_us_central1",
    simplecache={"cache_storage": "../gcs_cache"},
)
ag3

In [None]:
import malariagen_data

# Af1 API handle, configured like the Ag3 one: fsspec "simplecache::"
# chaining with the local cache directory ../gcs_cache.
af1 = malariagen_data.Af1(
    "simplecache::gs://vo_afun_release_master_us_central1",
    simplecache={"cache_storage": "../gcs_cache"},
)
af1

## Gene CNV frequencies

In [None]:
# Gene CNV frequencies over a 60 kbp window on 2R, using the
# AG1000G-BF-A / AG1000G-BF-B sample sets and coluzzii + gambiae samples.
ds = ag3.gene_cnv_frequencies_advanced(
    # Genomic window.
    region="2R:28,450,000-28,510,000",
    # Sample selection.
    sample_sets=["AG1000G-BF-A", "AG1000G-BF-B"],
    sample_query="taxon in ['coluzzii', 'gambiae']",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
)
ds

In [None]:
# Time-series plot of the frequencies dataset from the preceding cell.
ag3.plot_frequencies_time_series(
    ds,
    width=1000,
    height=500,
)

In [None]:
# Same 2R window as above, now across all of sample_sets="3.0" and with
# no sample_query, to feed the map plot in the next cell.
ds = ag3.gene_cnv_frequencies_advanced(
    # Genomic window.
    region="2R:28,450,000-28,510,000",
    # Sample selection.
    sample_sets="3.0",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
)
ds

In [None]:
# Interactive map of the gene CNV frequencies in `ds` (preceding cell).
ag3.plot_frequencies_interactive_map(ds)

## Amino acid change frequencies

In [None]:
# Amino acid change frequencies for transcript AGAP004707-RD in female
# coluzzii samples from the AG1000G-BF-A / AG1000G-BF-B sample sets.
ds = ag3.aa_allele_frequencies_advanced(
    transcript="AGAP004707-RD",
    # Sample selection.
    sample_sets=["AG1000G-BF-A", "AG1000G-BF-B"],
    sample_query="sex_call == 'F' and taxon == 'coluzzii'",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
    # Variant filter.
    variant_query="max_af > 0.05",
)
ds

In [None]:
# Time-series plot of the amino acid change frequencies computed above.
ag3.plot_frequencies_time_series(
    ds,
    width=600,
    height=400,
)

In [None]:
# Amino acid change frequencies for the same transcript, across all of
# sample_sets="3.0" with no sample_query, for the map plot below.
ds = ag3.aa_allele_frequencies_advanced(
    transcript="AGAP004707-RD",
    # Sample selection.
    sample_sets="3.0",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
    # Variant filter.
    variant_query="max_af > 0.05",
)
ds

In [None]:
# Interactive map of the amino acid change frequencies in `ds` (preceding cell).
ag3.plot_frequencies_interactive_map(ds)

In [None]:
# Show the sample sets exposed by the Af1 API (useful when picking a
# `sample_sets` value for the Af1 queries further down).
af1.sample_sets()

In [None]:
# Show the Af1 genome feature annotations.
# NOTE(review): presumably used to look up the transcript ID passed to the
# Af1 frequency queries below — confirm.
af1.genome_features()

In [None]:
# Amino acid change frequencies via the Af1 API for transcript
# LOC125767311_t1, across sample_sets="1.0".
ds = af1.aa_allele_frequencies_advanced(
    transcript="LOC125767311_t1",
    # Sample selection.
    sample_sets="1.0",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
    # Variant filter.
    variant_query="max_af > 0.05",
)
ds

In [None]:
# Interactive map of the Af1 amino acid change frequencies in `ds` (preceding cell).
af1.plot_frequencies_interactive_map(ds)

## SNP allele frequencies

In [None]:
# SNP allele frequencies for transcript AGAP004707-RD across four sample
# sets, gambiae + coluzzii samples, with the optional arguments
# (site_mask, nobs_mode, ci_method, drop_invariant) spelled out explicitly.
ds = ag3.snp_allele_frequencies_advanced(
    transcript="AGAP004707-RD",
    # Sample selection.
    sample_sets=["AG1000G-BF-A", "AG1000G-BF-B", "AG1000G-UG", "AG1000G-TZ"],
    sample_query="taxon in ['gambiae', 'coluzzii']",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
    # Site / variant filtering.
    site_mask=None,
    drop_invariant=True,
    variant_query="max_af > 0.05 and effect == 'NON_SYNONYMOUS_CODING'",
    # Observation counting mode and confidence-interval method.
    nobs_mode="called",
    ci_method="wilson",
)
ds

In [None]:
# Time-series plot of the SNP allele frequencies computed above.
ag3.plot_frequencies_time_series(
    ds,
    width=900,
    height=900,
)

In [None]:
# SNP allele frequencies grouped by month rather than year, limited to
# Burkina Faso samples collected after 2010, with a minimum cohort size of 5.
ds = ag3.snp_allele_frequencies_advanced(
    transcript="AGAP004707-RD",
    # Sample selection.
    sample_sets="3.0",
    sample_query="country == 'Burkina Faso' and year > 2010",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="month",
    min_cohort_size=5,
    # Variant filter.
    variant_query="max_af > 0.05 and effect == 'NON_SYNONYMOUS_CODING'",
)
ds

In [None]:
# Time-series plot of the monthly SNP allele frequencies computed above.
ag3.plot_frequencies_time_series(
    ds,
    width=800,
    height=400,
)

In [None]:
# SNP allele frequencies by year across all of sample_sets="3.0" with no
# sample_query, for the map plot in the next cell.
ds = ag3.snp_allele_frequencies_advanced(
    transcript="AGAP004707-RD",
    # Sample selection.
    sample_sets="3.0",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
    # Variant filter.
    variant_query="max_af > 0.05 and effect == 'NON_SYNONYMOUS_CODING'",
)
ds

In [None]:
# Interactive map of the SNP allele frequencies in `ds` (preceding cell).
ag3.plot_frequencies_interactive_map(ds)

In [None]:
# SNP allele frequencies via the Af1 API for transcript LOC125767311_t1,
# across sample_sets="1.0".
ds = af1.snp_allele_frequencies_advanced(
    transcript="LOC125767311_t1",
    # Sample selection.
    sample_sets="1.0",
    # Cohort grouping (area x period) and minimum cohort size.
    area_by="admin1_iso",
    period_by="year",
    min_cohort_size=10,
    # Variant filter.
    variant_query="max_af > 0.05 and effect == 'NON_SYNONYMOUS_CODING'",
)
ds

In [None]:
# Interactive map of the Af1 SNP allele frequencies in `ds` (preceding cell).
af1.plot_frequencies_interactive_map(ds)