# Notebook to process mutations from MARDy 2.0

## Import libraries

In [1]:
import pandas as pd
import numpy as np

## Parse dataframe of FKS mutations of MARDy 2.0

In [2]:
FKS = pd.read_excel('fks_data_long.xlsx')
FKS

Unnamed: 0,first author name,journal,year,pubmedid,species,gene or protein name,accession number for protein name,source,drug,mutation,...,excel,original drug,original protein,original mutation,original origin,original MIC,ortho_homolog,wt_AA,position,alt_AA
0,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Caspofungin,P647A,...,CB,caspofungin,FKS1,P647A,Lab,,Fks1,P,647.0,A
1,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Micafungin,P647A,...,CB,micafungin,FKS1,P647A,Lab,,Fks1,P,647.0,A
2,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Anidulafungin,P647A,...,CB,anidulafungin,FKS1,P647A,Lab,,Fks1,P,647.0,A
3,Ohyma,Antimicrobial Agents and Chemotherapy,2004,14693557,Saccharomyces cerevisiae,Fks1,,,Arbocandin C,N470K,...,CB,Arbocandin C,fks1,N470K,Lab,,Fks1,N,470.0,K
4,Ohyma,Antimicrobial Agents and Chemotherapy,2004,14693557,Saccharomyces cerevisiae,Fks1,,,Arbocandin C,L642S,...,CB,Arbocandin C,fks1,L642S,Lab,,Fks1,L,642.0,S
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1271,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Caspofungin,S645P,...,RS2,caspofungin,FKS1,S645P,,8 ug/mL,Fks1,S,645.0,P
1272,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Micafungin,S645P,...,RS2,micafungin,FKS1,S645P,,4 ug/mL,Fks1,S,645.0,P
1273,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Anidulafungin,D632E,...,RS2,anidulafungin,FKS1,D632E,,>2 ug/mL,Fks1,D,632.0,E
1274,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Caspofungin,D632E,...,RS2,caspofungin,FKS1,D632E,,>2 ug/mL,Fks1,D,632.0,E


Note: in the dataframe, there still appears to be duplicate entries due to two curators

In [3]:
FKS.columns

Index(['first author name', 'journal', 'year', 'pubmedid', 'species',
       'gene or protein name', 'accession number for protein name', 'source',
       'drug', 'mutation', 'degree of evidence', 'MIC', 'strain_ID',
       'strain origin if available', 'curator', 'notes', 'excel',
       'original drug', 'original protein', 'original mutation',
       'original origin', 'original MIC', 'ortho_homolog', 'wt_AA', 'position',
       'alt_AA'],
      dtype='object')

In [4]:
FKS['gene or protein name'].unique()

array(['Fks1', 'Fks2', 'Fks', 'Fks1/2', 'Fks1 or 2', 'Fks1 or Fks2'],
      dtype=object)

In [5]:
FKS.drug.unique()

array(['Caspofungin', 'Micafungin', 'Anidulafungin', 'Arbocandin C',
       '5-fluorocytosine', 'Posaconazole', 'Voriconazole', 'Itraconazole',
       'Fluconazole', 'Amphotericin B', 'CD101', 'Echinocandin',
       'Isavuconazole', 'Scy-078'], dtype=object)

In [6]:
print(FKS['degree of evidence'].unique())

[ 2.  1.  8. -8. -1.  4.  7.]


In [20]:
FKS_filtered = FKS[(FKS.drug.isin(['Caspofungin', 'Micafungin', 'Anidulafungin']))
                   & (FKS['gene or protein name'] != 'Fks2')
                   #& (FKS['degree of evidence'].isin(np.arange(-4,5)))
                  ]
FKS_filtered

Unnamed: 0,first author name,journal,year,pubmedid,species,gene or protein name,accession number for protein name,source,drug,mutation,...,excel,original drug,original protein,original mutation,original origin,original MIC,ortho_homolog,wt_AA,position,alt_AA
0,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Caspofungin,P647A,...,CB,caspofungin,FKS1,P647A,Lab,,Fks1,P,647.0,A
1,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Micafungin,P647A,...,CB,micafungin,FKS1,P647A,Lab,,Fks1,P,647.0,A
2,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Anidulafungin,P647A,...,CB,anidulafungin,FKS1,P647A,Lab,,Fks1,P,647.0,A
6,Zhu,Journal of Clinical Microbiology,2023,36975998,Candida auris,Fks1,,,Anidulafungin,S639Y,...,CB,Anidulafungin,Fks1,S639Y,Clinical,,Fks1,S,639.0,Y
7,Zhu,Journal of Clinical Microbiology,2023,36975998,Candida auris,Fks1,,,Anidulafungin,S639F,...,CB,Anidulafungin,Fks1,S639F,Clinical,,Fks1,S,639.0,F
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1271,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Caspofungin,S645P,...,RS2,caspofungin,FKS1,S645P,,8 ug/mL,Fks1,S,645.0,P
1272,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Micafungin,S645P,...,RS2,micafungin,FKS1,S645P,,4 ug/mL,Fks1,S,645.0,P
1273,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Anidulafungin,D632E,...,RS2,anidulafungin,FKS1,D632E,,>2 ug/mL,Fks1,D,632.0,E
1274,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Caspofungin,D632E,...,RS2,caspofungin,FKS1,D632E,,>2 ug/mL,Fks1,D,632.0,E


In [21]:
print(FKS_filtered.species.unique())

['Saccharomyces cerevisiae' 'Candida auris' 'Candida glabrata'
 'Candida albicans' 'Candida krusei' 'Candida tropicalis'
 'Aspergillus fumigatus' 'Candida dubliniensis' 'Candida kefyr'
 'Candida lusitaniae' 'Candida parapsilosis' 'Candida metapsilosis'
 'Pichia kudriavzevii' 'Nasakeomyces glabrata']


In [22]:
FKS_filtered.replace({'species':{'Nasakeomyces glabrata': 'Candida glabrata',
                                                'Pichia kudriavzevii': 'Candida krusei'
                                               }}, inplace=True)
print(FKS_filtered.species.unique())

['Saccharomyces cerevisiae' 'Candida auris' 'Candida glabrata'
 'Candida albicans' 'Candida krusei' 'Candida tropicalis'
 'Aspergillus fumigatus' 'Candida dubliniensis' 'Candida kefyr'
 'Candida lusitaniae' 'Candida parapsilosis' 'Candida metapsilosis']


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  FKS_filtered.replace({'species':{'Nasakeomyces glabrata': 'Candida glabrata',


## Import dataframe of aligned positions

In [23]:
df_pos = pd.read_excel('fks_positions.xlsx', index_col=0, header=[0,1,2])
df_pos

Unnamed: 0_level_0,Ungapped position,Ungapped position,Ungapped position,Ungapped position,Ungapped position,Ungapped position,Ungapped position,Ungapped position,Ungapped position,Ungapped position,...,aa,aa,aa,aa,aa,aa,aa,aa,aa,aa
species,Candida krusei (Pichia kudriavzevii),Scedosporium apiospermum,Saccharomyces cerevisiae,Microsporum canis,Saccharomyces cerevisiae,Candida glabrata,Fusarium verticillioides,Magnaporthe oryzae,Pneumocystis carinii,Candida glabrata,...,Madurella mycetomatis,Candida tropicalis,Cryptococcus neoformans,Paracoccidioides lutzii,Candida lusitaniae (Clavispora lusitaniae),Paracoccidioides brasiliensis,Aspergillus flavus,Pseudocercospora fijiensis,Histoplasma capsulatum,Aspergillus oryzae
gene_name,FKS1,FKS1,FKS2,FKS1,FKS1,FKS2,FKS1,FKS1,FKS1,FKS1,...,FKS1,FKS1,FKS1,FKS1,FKS1,FKS1,FKS1,FKS1,FKS1,FKS1
Alignment position,Unnamed: 1_level_3,Unnamed: 2_level_3,Unnamed: 3_level_3,Unnamed: 4_level_3,Unnamed: 5_level_3,Unnamed: 6_level_3,Unnamed: 7_level_3,Unnamed: 8_level_3,Unnamed: 9_level_3,Unnamed: 10_level_3,Unnamed: 11_level_3,Unnamed: 12_level_3,Unnamed: 13_level_3,Unnamed: 14_level_3,Unnamed: 15_level_3,Unnamed: 16_level_3,Unnamed: 17_level_3,Unnamed: 18_level_3,Unnamed: 19_level_3,Unnamed: 20_level_3,Unnamed: 21_level_3
1,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,...,M,M,M,M,M,M,M,M,M,M
2,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,2.0,...,S,V,S,S,S,S,S,C,S,S
3,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,3.0,...,G,-,Y,A,Y,A,G,R,A,G
4,,,,,,,,,,,...,-,-,-,-,-,-,-,S,-,-
5,,,,,,,,,,,...,-,-,-,-,-,-,-,F,-,-
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2412,1882.0,1883.0,1892.0,1915.0,1873.0,1894.0,1938.0,1913.0,1945.0,1860.0,...,A,N,N,N,S,H,S,L,A,S
2413,1883.0,1884.0,1893.0,1916.0,1874.0,1895.0,1939.0,1914.0,1946.0,1861.0,...,D,P,G,A,K,A,A,Y,R,A
2414,,,,,,,,,,,...,-,-,-,-,-,-,-,-,-,-
2415,1884.0,1885.0,1894.0,1917.0,1875.0,1896.0,1940.0,1915.0,1947.0,1862.0,...,R,-,V,R,D,R,T,G,L,T


In [24]:
species_from_df_pos = set([x[0] for x in df_pos['Ungapped position'].columns])
species_of_interest = [x for x in species_from_df_pos if x.split('(')[0].rstrip() in FKS_filtered.species.unique()]
print(species_of_interest)

['Candida kefyr (Kluyveromyces marxianus)', 'Aspergillus fumigatus', 'Candida lusitaniae (Clavispora lusitaniae)', 'Saccharomyces cerevisiae', 'Candida glabrata', 'Candida albicans', 'Candida dubliniensis', 'Candida tropicalis', 'Candida krusei (Pichia kudriavzevii)', 'Candida parapsilosis', 'Candida auris', 'Candida metapsilosis']


In [25]:
df_pos.rename(columns={'Candida lusitaniae (Clavispora lusitaniae)': 'Candida lusitaniae',
                       'Candida kefyr (Kluyveromyces marxianus)': 'Candida kefyr',
                       'Candida krusei (Pichia kudriavzevii)': 'Candida krusei'
                      }, inplace=True)

In [26]:
def update_position(dataframe, df_positions):
    for _, row in dataframe.iterrows():
        position = float(row['position'])
        species = row['species']
        
        # Retrieve equivalent of position in the Scer FKS1 sequence
        pos_cerevisiae = df_positions.loc[
            df_positions[('Ungapped position', species, 'FKS1')] == position,
            ('Ungapped position', 'Saccharomyces cerevisiae', 'FKS1')].iloc[0]
        
        # Retrieve equivalent of WT residue in the Scer Fks1 sequence
        aa_cerevisiae = df_positions.loc[
            df_positions[('Ungapped position', species, 'FKS1')] == position,
            ('aa', 'Saccharomyces cerevisiae', 'FKS1')].iloc[0]
        
        # Add columns directly to specified dataframe
        dataframe.at[_, 'pos_cerevisiae'] = pos_cerevisiae
        dataframe.at[_, 'aa_cerevisiae'] = aa_cerevisiae

In [27]:
update_position(FKS_filtered, df_pos)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  dataframe.at[_, 'pos_cerevisiae'] = pos_cerevisiae
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  dataframe.at[_, 'aa_cerevisiae'] = aa_cerevisiae


In [35]:
FKS_filtered['mutation_cerevisiae'] = FKS_filtered.apply(lambda row: row.aa_cerevisiae + str(int(row.pos_cerevisiae)) + row.alt_AA if not np.isnan(row.pos_cerevisiae) else np.nan, axis=1)
FKS_filtered

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  FKS_filtered['mutation_cerevisiae'] = FKS_filtered.apply(lambda row: row.aa_cerevisiae + str(int(row.pos_cerevisiae)) + row.alt_AA if not np.isnan(row.pos_cerevisiae) else np.nan, axis=1)


Unnamed: 0,first author name,journal,year,pubmedid,species,gene or protein name,accession number for protein name,source,drug,mutation,...,original mutation,original origin,original MIC,ortho_homolog,wt_AA,position,alt_AA,pos_cerevisiae,aa_cerevisiae,mutation_cerevisiae
0,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Caspofungin,P647A,...,P647A,Lab,,Fks1,P,647.0,A,647.0,P,P647A
1,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Micafungin,P647A,...,P647A,Lab,,Fks1,P,647.0,A,647.0,P,P647A
2,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Anidulafungin,P647A,...,P647A,Lab,,Fks1,P,647.0,A,647.0,P,P647A
6,Zhu,Journal of Clinical Microbiology,2023,36975998,Candida auris,Fks1,,,Anidulafungin,S639Y,...,S639Y,Clinical,,Fks1,S,639.0,Y,643.0,S,S643Y
7,Zhu,Journal of Clinical Microbiology,2023,36975998,Candida auris,Fks1,,,Anidulafungin,S639F,...,S639F,Clinical,,Fks1,S,639.0,F,643.0,S,S643F
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1271,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Caspofungin,S645P,...,S645P,,8 ug/mL,Fks1,S,645.0,P,643.0,S,S643P
1272,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Micafungin,S645P,...,S645P,,4 ug/mL,Fks1,S,645.0,P,643.0,S,S643P
1273,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Anidulafungin,D632E,...,D632E,,>2 ug/mL,Fks1,D,632.0,E,646.0,D,D646E
1274,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Caspofungin,D632E,...,D632E,,>2 ug/mL,Fks1,D,632.0,E,646.0,D,D646E


In [57]:
FKS1HS1 = FKS_filtered[FKS_filtered.pos_cerevisiae.isin(np.arange(639,648))].reset_index(drop=True)
FKS1HS1.drop(FKS1HS1[FKS1HS1['original mutation'].str.contains(',|and', regex=True)].index, inplace=True)
FKS1HS1

Unnamed: 0,first author name,journal,year,pubmedid,species,gene or protein name,accession number for protein name,source,drug,mutation,...,original mutation,original origin,original MIC,ortho_homolog,wt_AA,position,alt_AA,pos_cerevisiae,aa_cerevisiae,mutation_cerevisiae
0,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Caspofungin,P647A,...,P647A,Lab,,Fks1,P,647.0,A,647.0,P,P647A
1,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Micafungin,P647A,...,P647A,Lab,,Fks1,P,647.0,A,647.0,P,P647A
2,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,18443110,Saccharomyces cerevisiae,Fks1,AAC48981,,Anidulafungin,P647A,...,P647A,Lab,,Fks1,P,647.0,A,647.0,P,P647A
3,Zhu,Journal of Clinical Microbiology,2023,36975998,Candida auris,Fks1,,,Anidulafungin,S639Y,...,S639Y,Clinical,,Fks1,S,639.0,Y,643.0,S,S643Y
4,Zhu,Journal of Clinical Microbiology,2023,36975998,Candida auris,Fks1,,,Anidulafungin,S639F,...,S639F,Clinical,,Fks1,S,639.0,F,643.0,S,S643F
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
381,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Caspofungin,S645P,...,S645P,,8 ug/mL,Fks1,S,645.0,P,643.0,S,S643P
382,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2010,20145084,Candida albicans,Fks1,,,Micafungin,S645P,...,S645P,,4 ug/mL,Fks1,S,645.0,P,643.0,S,S643P
383,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Anidulafungin,D632E,...,D632E,,>2 ug/mL,Fks1,D,632.0,E,646.0,D,D646E
384,Cleary,Antimicrobial Agents and Chemotherapy,2008,18378714,Candida glabrata,Fks1,,,Caspofungin,D632E,...,D632E,,>2 ug/mL,Fks1,D,632.0,E,646.0,D,D646E


In [65]:
cross_resistance = FKS1HS1.groupby(['mutation_cerevisiae','drug','degree of evidence']).size().reset_index(name='nb_entries')
cross_resistance

Unnamed: 0,mutation_cerevisiae,drug,degree of evidence,nb_entries
0,D646E,Anidulafungin,8.0,4
1,D646E,Caspofungin,8.0,4
2,D646E,Micafungin,8.0,4
3,D646G,Anidulafungin,-8.0,1
4,D646G,Caspofungin,8.0,1
...,...,...,...,...
101,S643Y,Caspofungin,4.0,2
102,S643Y,Caspofungin,7.0,1
103,S643Y,Caspofungin,8.0,4
104,S643Y,Micafungin,4.0,1


In [68]:
cross_resistance[cross_resistance['degree of evidence'] < 0]

Unnamed: 0,mutation_cerevisiae,drug,degree of evidence,nb_entries
3,D646G,Anidulafungin,-8.0,1
5,D646G,Micafungin,-8.0,1
6,D646H,Anidulafungin,-8.0,1
7,D646H,Caspofungin,-8.0,1
8,D646H,Micafungin,-8.0,1
12,D646Y,Anidulafungin,-8.0,2
14,D646Y,Caspofungin,-8.0,2
16,D646Y,Micafungin,-8.0,2
22,F639I,Anidulafungin,-8.0,1
24,F639I,Micafungin,-8.0,1


In [22]:
mardymut_df = FKS1HS1[FKS1HS1['gene or protein name']!='Fks1/2'][['first author name', 'journal', 'year', 'species', 'gene or protein name', 'drug', 'mutation', 'degree of evidence', 'MIC', 'strain_ID', 'strain origin if available', 'notes', 'mutation_cerevisiae']]
mardymut_df

Unnamed: 0,first author name,journal,year,species,gene or protein name,drug,mutation,degree of evidence,MIC,strain_ID,strain origin if available,notes,mutation_cerevisiae
0,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,Saccharomyces cerevisiae,Fks1,Caspofungin,P647A,2.0,0.5 μg/mL,BY4742,Lab,"CLSI with YPD, The equivalent in Candida parap...",P647A
1,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,Saccharomyces cerevisiae,Fks1,Micafungin,P647A,2.0,0.5 μg/mL,BY4742,Lab,"CLSI with YPD, The equivalent in Candida parap...",P647A
2,Garcia-Effron,Antimicrobial Agents and Chemotherapy,2008,Saccharomyces cerevisiae,Fks1,Anidulafungin,P647A,2.0,0.5 μg/mL,BY4742,Lab,"CLSI with YPD, The equivalent in Candida parap...",P647A
89,Park,Antimicrobial Agents and Chemotherapy,2005,Candida albicans,Fks1,Caspofungin,S645P,1.0,2 μg/mL,Transformant 1,Lab,,S643P
90,Park,Antimicrobial Agents and Chemotherapy,2005,Candida albicans,Fks1,Caspofungin,S645P,1.0,2 μg/mL,Transformant 2,Lab,,S643P
91,Park,Antimicrobial Agents and Chemotherapy,2005,Candida albicans,Fks1,Caspofungin,S645P,1.0,2 μg/mL,Transformant 3,Lab,,S643P
92,Park,Antimicrobial Agents and Chemotherapy,2005,Candida albicans,Fks1,Caspofungin,S645P,1.0,2 μg/mL,Transformant 8,Lab,,S643P
93,Park,Antimicrobial Agents and Chemotherapy,2005,Candida albicans,Fks1,Caspofungin,S645P,1.0,4 μg/mL,pJAM11 in CAI4-R1,Lab,,S643P
313,Avramovska,Frontiers in Fungal Biology,2022,Candida albicans,Fks1,Caspofungin,F641C,4.0,Not determined,MH84 (2N),Evolved,Looked at FKS1 as candidate gene; MIC values p...,F639C
315,Avramovska,Frontiers in Fungal Biology,2022,Candida albicans,Fks1,Caspofungin,S645F,4.0,Not determined,MH128 (4N),Evolved,Looked at FKS1 as candidate gene; MIC values p...,S643F


In [23]:
mardymut_df.to_csv('mardymut_df.csv')

In [24]:
mardy_mut = mardymut_df.mutation_cerevisiae.unique()
print(len(mardy_mut), mardy_mut)

11 ['P647A' 'S643P' 'F639C' 'S643F' 'S643Y' 'F639del' 'L642Y' 'F639V' 'F639S'
 'L642F' 'S643C']


In [25]:
print(mardymut_df.species.unique())

['Saccharomyces cerevisiae' 'Candida albicans' 'Candida glabrata'
 'Aspergillus fumigatus' 'Candida lusitaniae' 'Candida parapsilosis'
 'Candida metapsilosis']


In [26]:
print(mardymut_df['degree of evidence'].unique())

[2. 1. 4.]
