In [2]:
import pandas as pd
import altair as alt
# Switch Altair to the VegaFusion data transformer (see the Altair docs on
# large datasets for what this changes about how chart data is handled).
alt.data_transformers.enable("vegafusion")

# Read the annotated summary table and keep only the rows that carry a
# `domain` annotation; rows where `domain` is missing are dropped.
func_data_ann = (
    pd.read_csv('../results/annotated_summary_csvs/entry_293T-Mxra8_C636_293T-TIM1_Mxra8-binding_annotated.csv')
    .dropna(subset=['domain'])
)

In [3]:
# Strip plot of the "entry in 293T_Mxra8 cells" column, one row per `region`.
# `order` fixes the top-to-bottom order of the rows; every region is mapped to
# the same fill colour.
order = ['E3', 'E2', '6K', 'E1']
colors = dict.fromkeys(order, '#E198B5')

# Layer 1: one translucent dot per data row. The calculated `jitter` field is a
# Box-Muller expression (approximately standard-normal noise) that is used as
# the y offset so dots spread out inside their region band.
points = (
    alt.Chart(func_data_ann)
    .transform_calculate(jitter="sqrt(-2*log(random()))*cos(2*PI*random())")
    .mark_circle(size=20, opacity=0.2)
    .encode(
        y=alt.Y("region:N", sort=order, title=None),
        x=alt.X("entry in 293T_Mxra8 cells:Q", title=["Mutation effect on cell entry"]),
        yOffset="jitter:Q",
        color=alt.Color(
            "region:N",
            scale=alt.Scale(domain=list(colors), range=list(colors.values())),
            legend=None,
        ),
        tooltip=['sequential_site', 'wildtype', 'mutant', 'entry in 293T_Mxra8 cells'],
    )
)

# Layer 2: a black tick at the median of the entry column for each region.
median_line = (
    alt.Chart(func_data_ann)
    .mark_tick(color='black', thickness=3, size=25)
    .encode(
        y=alt.Y('region:N', sort=order),
        x=alt.X('median(entry in 293T_Mxra8 cells):Q'),
    )
)

# Layer 3: dashed vertical reference rule at x = 0 (drawn from a one-row frame).
vline = (
    alt.Chart(pd.DataFrame({'x': [0]}))
    .mark_rule(color='black', size=1.25, opacity=1.0, strokeDash=[6, 6])
    .encode(x='x:Q')
)

# Stack the three layers, size and title the figure, then apply the axis fonts.
# `configure_axis` is a top-level chart config, so it is applied to the layered
# chart rather than to the individual layers.
chart = (
    alt.layer(points, median_line, vline)
    .properties(
        height=200,
        width=200,
        title=alt.TitleParams(
            text='CHIKV E proteins',
            anchor='middle',
            fontSize=16,
            fontWeight='bold',
            font='Arial',
        ),
    )
    .configure_axis(
        labelFont='Arial',
        labelFontSize=14,
        titleFont='Arial',
        titleFontSize=14,
        titleFontWeight='normal',
    )
)
chart.show()


In [4]:
# Strip plot of the "entry in 293T_Mxra8 cells" column, one row per `domain`.
# `order` fixes the top-to-bottom order of the rows; every domain is mapped to
# the same fill colour.
order = [
    'E3',
    'E2-n-linker',
    'E2-domain a',
    'E2-arch1',
    'E2-domain b',
    'E2-arch2',
    'E2-domain c',
    'E2-stem',
    'E2-transmembrane',
    'E2-cytoplasmic',
    '6K',
    'E1-domain I',
    'E1-domain II',
    'E1-fusion loop',
    'E1-domain III',
    'E1-stem',
    'E1-transmembrane',
    'E1-cytoplasmic',
]
colors = dict.fromkeys(order, '#F28D6F')

# Layer 1: one translucent dot per data row. The calculated `jitter` field is a
# Box-Muller expression (approximately standard-normal noise) that is used as
# the y offset so dots spread out inside their domain band.
points = (
    alt.Chart(func_data_ann)
    .transform_calculate(jitter="sqrt(-2*log(random()))*cos(2*PI*random())")
    .mark_circle(size=20, opacity=0.3)
    .encode(
        y=alt.Y("domain:N", sort=order, title=None),
        x=alt.X("entry in 293T_Mxra8 cells:Q", title=["Mutation effect on cell entry"]),
        yOffset="jitter:Q",
        color=alt.Color(
            "domain:N",
            scale=alt.Scale(domain=list(colors), range=list(colors.values())),
            legend=None,
        ),
        tooltip=['sequential_site', 'wildtype', 'mutant', 'entry in 293T_Mxra8 cells'],
    )
)

# Layer 2: a black tick at the median of the entry column for each domain.
# The tick is shorter than in the per-region plot because there are more rows.
median_line = (
    alt.Chart(func_data_ann)
    .mark_tick(color='black', thickness=3, size=12)
    .encode(
        y=alt.Y('domain:N', sort=order),
        x=alt.X('median(entry in 293T_Mxra8 cells):Q'),
    )
)

# Layer 3: dashed vertical reference rule at x = 0 (drawn from a one-row frame).
vline = (
    alt.Chart(pd.DataFrame({'x': [0]}))
    .mark_rule(color='black', size=1.25, opacity=1.0, strokeDash=[6, 6])
    .encode(x='x:Q')
)

# Stack the three layers, size and title the figure, then apply the axis fonts.
# `configure_axis` is a top-level chart config, so it is applied to the layered
# chart rather than to the individual layers.
chart = (
    alt.layer(points, median_line, vline)
    .properties(
        height=300,
        width=200,
        title=alt.TitleParams(
            text='CHIKV E domains',
            anchor='middle',
            fontSize=16,
            fontWeight='bold',
            font='Arial',
        ),
    )
    .configure_axis(
        labelFont='Arial',
        labelFontSize=12,
        titleFont='Arial',
        titleFontSize=14,
        titleFontWeight='normal',
    )
)
chart.show()


In [10]:
# Strip plot of the "entry in 293T_Mxra8 cells" column, one row per value of
# the `contacts` column. `order` fixes the top-to-bottom order of the rows;
# every contact category is mapped to the same fill colour.
order = ['no', 'wrapped', 'intraspike', 'interspike']
colors = dict.fromkeys(order, '#023FA5')

# Layer 1: one translucent dot per data row. The calculated `jitter` field is a
# Box-Muller expression (approximately standard-normal noise) that is used as
# the y offset so dots spread out inside their category band.
points = (
    alt.Chart(func_data_ann)
    .transform_calculate(jitter="sqrt(-2*log(random()))*cos(2*PI*random())")
    .mark_circle(size=20, opacity=0.2)
    .encode(
        y=alt.Y("contacts:N", sort=order, title=None),
        x=alt.X("entry in 293T_Mxra8 cells:Q", title=["Mutation effect on cell entry"]),
        yOffset="jitter:Q",
        color=alt.Color(
            "contacts:N",
            scale=alt.Scale(domain=list(colors), range=list(colors.values())),
            legend=None,
        ),
        tooltip=['sequential_site', 'wildtype', 'mutant', 'entry in 293T_Mxra8 cells'],
    )
)

# Layer 2: a black tick at the median of the entry column for each contact
# category.
median_line = (
    alt.Chart(func_data_ann)
    .mark_tick(color='black', thickness=3, size=25)
    .encode(
        y=alt.Y('contacts:N', sort=order),
        x=alt.X('median(entry in 293T_Mxra8 cells):Q'),
    )
)

# Layer 3: dashed vertical reference rule at x = 0 (drawn from a one-row frame).
vline = (
    alt.Chart(pd.DataFrame({'x': [0]}))
    .mark_rule(color='black', size=1.25, opacity=1.0, strokeDash=[6, 6])
    .encode(x='x:Q')
)

# Stack the three layers, size and title the figure, then apply the axis fonts.
# `configure_axis` is a top-level chart config, so it is applied to the layered
# chart rather than to the individual layers.
chart = (
    alt.layer(points, median_line, vline)
    .properties(
        height=200,
        width=200,
        title=alt.TitleParams(
            text='Mxra8 contacts',
            anchor='middle',
            fontSize=16,
            fontWeight='bold',
            font='Arial',
        ),
    )
    .configure_axis(
        labelFont='Arial',
        labelFontSize=14,
        titleFont='Arial',
        titleFontSize=14,
        titleFontWeight='normal',
    )
)
chart.show()
