In [1]:
# Notebook parameters. Values here are for development only and
# will be overridden when running via snakemake and papermill.
# Of these, only `contig` is read directly by the cells shown in this
# notebook (it is passed to load_signals() and plot_signals()); the other
# values are presumably consumed by the setup scripts — TODO confirm.
contig = "2RL"
cohorts_analysis = "20240924"
analysis_version = "2025.02.07"
dask_scheduler = "single-threaded"

In [2]:
# Parameters
# These assignments run after the development defaults in the previous cell,
# so the values set here (e.g. contig = "X", analysis_version = "2025.02.25")
# are the ones in effect for the rest of the notebook.
analysis_version = "2025.02.25"
min_cohort_size = 15
max_cohort_size = 100
sample_sets = [
    "3.0",
    "1237-VO-BJ-DJOGBENOU-VMF00050",
    "1237-VO-BJ-DJOGBENOU-VMF00067",
    "1244-VO-GH-YAWSON-VMF00051",
    "1245-VO-CI-CONSTANT-VMF00054",
    "1253-VO-TG-DJOGBENOU-VMF00052",
    "1178-VO-UG-LAWNICZAK-VMF00025",
    "1244-VO-GH-YAWSON-VMF00149",
    "barron-2019",
    "crawford-2016",
    "tennessen-2021",
    "bergey-2019",
    "campos-2021",
    "fontaine-2015-rebuild",
]
sample_query = "taxon in ['gambiae', 'coluzzii', 'arabiensis', 'bissau']"
contigs = ["2RL", "3RL", "X"]
cohorts_analysis = "20240924"
# NOTE(review): "3L" does not appear in `contigs` above, which uses the
# joined-arm name "3RL" — confirm this is the intended contig identifier.
h12_calibration_contig = "3L"
h12_signal_detection_min_delta_aic = 1000
h12_signal_detection_min_stat_max = 0.1
h12_signal_detection_gflanks = [6]
dask_scheduler = "single-threaded"
alerts = ["01", "02", "03", "04", "05", "06", "07", "08", "09"]
# The contig this page is rendered for; passed to load_signals() and
# plot_signals() further down.
contig = "X"


In [3]:
from pyprojroot import here

# here() supplies the base path used to locate the two setup scripts below.
root = here()
# `%run -i` executes each script inside this notebook's namespace, so names
# they define stay available afterwards. Names used later but not defined in
# this notebook (output_notebook, Markdown, load_signals, plot_signals)
# presumably come from these scripts — TODO confirm.
%run -i {root}/workflow/common/scripts/setup.py
%run -i {root}/workflow/site/scripts/page-setup.py

# N.B., do not add the "remove-output" tag to this cell!!! If you do,
# the bokeh javascript libraries will not get loaded in the generated
# HTML page. The call to output_notebook() injects javascript in the
# cell output which triggers the bokeh javascript libraries to be loaded
# in the page.
output_notebook(hide_banner=True)

# Chromosome X

In [4]:
# Introductory text for the signals plot. The Markdown object is the last
# expression of the cell, so it is what the cell displays.
# NOTE(review): the text names gambiae, coluzzii and arabiensis, while
# `sample_query` in the parameters cell also includes 'bissau' — confirm
# whether the wording should mention it.
Markdown(
    """The plot below shows selection signals discovered in the major vector species *An. gambiae*, 
    *An. coluzzii* or *An. arabiensis*, all of which are members of the *Anopheles gambiae* species complex. 
    The reference genome used for these analyses is the AgamP4 PEST reference. Hover over a 
    signal for more information about the species, location, date and selection statistic in which the signal 
    was found. Click on a signal to see the underlying selection scan data."""
)

The plot below shows selection signals discovered in the major vector species *An. gambiae*, 
    *An. coluzzii* or *An. arabiensis*, all of which are members of the *Anopheles gambiae* species complex. 
    The reference genome used for these analyses is the AgamP4 PEST reference. Hover over a 
    signal for more information about the species, location, date and selection statistic in which the signal 
    was found. Click on a signal to see the underlying selection scan data.

In [5]:
# Load the signals for the contig chosen in the parameters cell.
# load_signals is not defined in this notebook (presumably provided by the
# setup scripts). Its result is used as a pandas DataFrame by the next cell,
# which selects columns by name and calls .assign()/.style on it.
df_signals = load_signals(contig=contig)

# Last expression of the cell: whatever plot_signals returns or emits becomes
# the cell output.
plot_signals(df=df_signals, contig=contig)

In [6]:
# Keep only the columns needed for the summary table, then add a
# human-readable "focal_region" label built from the contig and the
# thousands-separated start/stop positions,
# e.g. "X ( 9,472,757 - 9,794,544 )".
df_signals = df_signals[
    [
        "contig",
        "focus_pstart",
        "focus_pstop",
        "cohort_id",
        "cohort_label",
        "statistic",
        "delta_i",
    ]
].assign(
    focal_region=lambda signals: (
        signals["contig"]
        + " ( "
        + signals["focus_pstart"].map("{:,}".format)
        + " - "
        + signals["focus_pstop"].map("{:,}".format)
        + " )"
    )
)


def make_clickable(url, name):
    """Return an HTML anchor linking to ``url`` with ``name`` as the link text.

    The link carries ``target="_blank"`` and ``rel="noopener noreferrer"``.
    Both arguments are inserted verbatim; no HTML escaping is applied.
    """
    anchor_attrs = f'href="{url}" rel="noopener noreferrer" target="_blank"'
    return f"<a {anchor_attrs}>{name}</a>"


# Relative URL of each cohort's page: ../cohort/<cohort_id>.html
df_signals["url"] = "../cohort/" + df_signals["cohort_id"] + ".html"

# Turn each cohort label into a link to its cohort page.
# A positional zip over the two columns is used instead of
# DataFrame.apply(axis=1): it avoids building a Series per row, and it
# always produces a list of the right length. On an empty frame (a contig
# with no signals) apply(axis=1) may hand back a DataFrame instead of a
# Series depending on the pandas version, which makes the single-column
# assignment raise.
df_signals["cohort_label"] = [
    make_clickable(url, label)
    for url, label in zip(df_signals["url"], df_signals["cohort_label"])
]

# Show only the reader-facing columns, with display names, and hide the
# index. The Styler is the last expression so it becomes the cell output.
df_signals[["focal_region", "cohort_label", "statistic", "delta_i"]].rename(
    columns={
        "focal_region": "Focal Region",
        "cohort_label": "Cohort Label",
        "statistic": "Statistic",
        "delta_i": "Delta i",
    }
).style.hide(axis="index")

Focal Region,Cohort Label,Statistic,Delta i
"X ( 9,472,757 - 9,794,544 )",Ghana / Adansi South / gambiae / 2018 / Q4,H12,2460
"X ( 9,108,215 - 9,441,407 )",Cote d'Ivoire / Sud-Comoe / gambiae / 2017 / Q3,H12,1941
"X ( 9,113,524 - 9,445,221 )",Ghana / La-Nkwantanang-Madina / gambiae / 2017 / Q4,H12,1600
"X ( 8,773,284 - 8,825,105 )",Benin / Avrankou / coluzzii / 2017 / Q3,H12,1397
"X ( 9,126,143 - 9,337,501 )",Cote d'Ivoire / Agneby-Tiassa / coluzzii / 2012,H12,2286
"X ( 9,156,295 - 9,363,702 )",Burkina Faso / Houet / gambiae / 2014 / Q3,H12,1961
"X ( 9,225,417 - 9,256,905 )",Burkina Faso / Houet / gambiae / 2012 / Q3,H12,3149
"X ( 9,190,961 - 9,232,268 )",Burkina Faso / Comoe / coluzzii / 2012,H12,2732
"X ( 9,227,785 - 9,254,301 )","Gambia, The / Lower Fuladu West / coluzzii / 2012 / Q4",H12,3498
"X ( 9,216,779 - 9,243,334 )",Burkina Faso / Houet / coluzzii / 2012 / Q3,H12,3573
