In [9]:
# Import modules
import os
import pandas as pd
import rdkit
# from rdkit.Chem import Draw
# from rdkit.Chem.Draw import IPythonConsole
from rdkit.Chem import Descriptors
from rdkit.Chem.MolStandardize import rdMolStandardize

# Expand to see all columns
pd.set_option('display.max_columns', None)

# Suppress RDKit Output
rdkit.RDLogger.DisableLog('rdApp.*')

# Print versions
print(f"Pandas Version: {pd.__version__}")
print(f"RDKit Version: {rdkit.__version__}")

Pandas Version: 2.2.3
RDKit Version: 2024.09.6


In [10]:
# Paths
path_data = os.path.realpath("../data")
input_file = "chembl_approved_small_molecule_drugs.csv"
output_file = "chembl_approved_small_molecule_drugs_rdkit-profiled.csv"
input_path = os.path.join(path_data, input_file)
output_path = os.path.join(path_data, output_file)

# Load CSV
df = pd.read_csv(input_path)
df.head()

Unnamed: 0,chembl_molecule_id,smiles,molregno,pref_name,max_phase,therapeutic_flag,dosed_ingredient,structure_type,chebi_par_id,molecule_type,first_approval,oral,parenteral,topical,black_box_warning,natural_product,first_in_class,chirality,prodrug,inorganic_flag,usan_year,availability_type,usan_stem,polymer_flag,usan_substem,usan_stem_definition,indication_class,withdrawn_flag,chemical_probe,orphan,mw_freebase,alogp,hba,hbd,psa,rtb,ro3_pass,num_ro5_violations,cx_most_apka,cx_most_bpka,cx_logp,cx_logd,molecular_species,full_mwt,aromatic_rings,heavy_atoms,qed_weighted,mw_monoisotopic,full_molformula,hba_lipinski,hbd_lipinski,num_lipinski_ro5_violations,np_likeness_score
0,CHEMBL1200542,CC(=O)OCC(=O)[C@H]1CC[C@H]2[C@@H]3CCC4=CC(=O)C...,674493,DESOXYCORTICOSTERONE ACETATE,4.0,1,1,MOL,34671.0,Small molecule,1939.0,0,1,0,0,1,0,1,0,0,,0.0,-cort-; -ster-; -terone,0,-cort-; -ster-; -terone,"cortisone derivatives; steroids (androgens, an...",Adrenocortical Steroid (salt-regulating),0,0,0,372.51,4.27,4.0,0.0,60.44,3.0,N,0.0,,,3.77,3.77,NEUTRAL,372.51,0.0,27.0,0.69,372.2301,C23H32O4,4.0,0.0,0.0,1.96
1,CHEMBL1200728,Cl.N=C(N)N,674679,GUANIDINE HYDROCHLORIDE,4.0,1,1,MOL,32735.0,Small molecule,1939.0,1,0,0,0,0,0,2,0,0,,1.0,guan-,0,guan-,antihypertensives (guanidine derivatives),,0,0,0,59.07,-1.16,1.0,3.0,75.89,0.0,N,0.0,,12.55,-1.24,-3.65,BASE,95.53,0.0,4.0,0.24,59.0483,CH6ClN3,3.0,5.0,0.0,0.32
2,CHEMBL1200982,CCC(C)C1(CC)C(=O)[N-]C(=O)NC1=O.[Na+],674933,BUTABARBITAL SODIUM,4.0,1,1,MOL,,Small molecule,1939.0,1,0,0,0,0,0,0,0,0,,1.0,-barb-,0,-barb-,barbituric acid derivatives,Sedative-Hypnotic,0,0,0,212.25,0.79,3.0,2.0,75.27,3.0,N,0.0,7.48,,1.45,1.19,NEUTRAL,234.23,0.0,15.0,0.68,212.1161,C10H15N2NaO3,5.0,2.0,0.0,0.32
3,CHEMBL3989520,NCCc1c[nH]cn1.O=P(O)(O)O.O=P(O)(O)O,2197391,HISTAMINE PHOSPHATE,4.0,1,1,MOL,,Small molecule,1939.0,0,1,0,1,0,0,2,0,0,,0.0,,0,,,,0,0,0,111.15,-0.09,2.0,2.0,54.7,2.0,Y,0.0,,9.58,-0.7,-2.85,BASE,307.14,1.0,8.0,0.56,111.0796,C5H15N3O8P2,3.0,3.0,0.0,0.0
4,CHEMBL449,CCC(C)C1(CC)C(=O)NC(=O)NC1=O,2393,BUTABARBITAL,4.0,1,0,MOL,3228.0,Small molecule,1939.0,1,0,0,0,1,0,0,0,0,,1.0,-barb-,0,-barb-,barbituric acid derivatives,Sedative-Hypnotic,0,0,0,212.25,0.79,3.0,2.0,75.27,3.0,N,0.0,7.48,,1.45,1.19,NEUTRAL,212.25,0.0,15.0,0.68,212.1161,C10H16N2O3,5.0,2.0,0.0,0.32


In [11]:
largest_frag_app = rdMolStandardize.LargestFragmentChooser()
uncharge_app = rdMolStandardize.Uncharger()
mols = []
skipped_indices = []
for ii, smi in enumerate(df["smiles"]):
    try:
        mol = rdkit.Chem.MolFromSmiles(
            smi,
            sanitize = False
        )
        assert mol is not None
    except Exception as e:
        skipped_indices.append(ii)
        if pd.notna(smi):
            print(f"Error processing SMILES at index {ii}: {smi}")
            print(f"Exception: {e}")
        continue
    try:
        rdkit.Chem.SanitizeMol(mol)
        largest_frag_app.chooseInPlace(mol)
        uncharge_app.unchargeInPlace(mol)
    except Exception as e:
        skipped_indices.append(ii)
        print(f"Error processing molecule at index {ii}")
        print(f"Exception: {e}")
        continue
    descriptors = {
        "idx": ii,
        "SMILES": rdkit.Chem.MolToSmiles(mol),
    }
    for descriptor, fxn in Descriptors._descList:
        try:
            value = fxn(mol)
        except Exception as e:
            # print(f"Error calculating {descriptor} at index {ii}")
            # print(f"Exception: {e}")
            value = None
        descriptors[f"rdkit_{descriptor}"] = value
    mols.append(descriptors)

print(f"{len(mols)}/{df.shape[0]} molecules processed!")
print(f"{df.shape[0]-len(mols)}/{df.shape[0]} molecules skipped!")

3382/3517 molecules processed!
135/3517 molecules skipped!


In [12]:
column_update = { cc: f"chembl_{cc}" for cc in df.columns[1:] }
df = df.rename(columns=column_update)
# for mol_dict in mols:
#     idx = mol_dict["idx"]
#     for key, value in mol_dict.items():
#         if key != "idx":
#             col = key if key == "SMILES" else key.lower()
#             df.loc[idx, col] = value
# Convert list of dictionaries to a DataFrame
mol_df = pd.DataFrame(mols)
mol_df.set_index("idx", inplace=True)

mol_df.columns = [ col if col == "SMILES" else col.lower() 
                   for col in mol_df.columns ]

df = pd.concat([df, mol_df], axis=1)
cols = df.columns.tolist()
cols.remove('SMILES')
cols.insert(0, 'SMILES')
df = df[cols]

# Display results
df.head()

Unnamed: 0,SMILES,chembl_molecule_id,chembl_smiles,chembl_molregno,chembl_pref_name,chembl_max_phase,chembl_therapeutic_flag,chembl_dosed_ingredient,chembl_structure_type,chembl_chebi_par_id,chembl_molecule_type,chembl_first_approval,chembl_oral,chembl_parenteral,chembl_topical,chembl_black_box_warning,chembl_natural_product,chembl_first_in_class,chembl_chirality,chembl_prodrug,chembl_inorganic_flag,chembl_usan_year,chembl_availability_type,chembl_usan_stem,chembl_polymer_flag,chembl_usan_substem,chembl_usan_stem_definition,chembl_indication_class,chembl_withdrawn_flag,chembl_chemical_probe,chembl_orphan,chembl_mw_freebase,chembl_alogp,chembl_hba,chembl_hbd,chembl_psa,chembl_rtb,chembl_ro3_pass,chembl_num_ro5_violations,chembl_cx_most_apka,chembl_cx_most_bpka,chembl_cx_logp,chembl_cx_logd,chembl_molecular_species,chembl_full_mwt,chembl_aromatic_rings,chembl_heavy_atoms,chembl_qed_weighted,chembl_mw_monoisotopic,chembl_full_molformula,chembl_hba_lipinski,chembl_hbd_lipinski,chembl_num_lipinski_ro5_violations,chembl_np_likeness_score,rdkit_maxabsestateindex,rdkit_maxestateindex,rdkit_minabsestateindex,rdkit_minestateindex,rdkit_qed,rdkit_sps,rdkit_molwt,rdkit_heavyatommolwt,rdkit_exactmolwt,rdkit_numvalenceelectrons,rdkit_numradicalelectrons,rdkit_maxpartialcharge,rdkit_minpartialcharge,rdkit_maxabspartialcharge,rdkit_minabspartialcharge,rdkit_fpdensitymorgan1,rdkit_fpdensitymorgan2,rdkit_fpdensitymorgan3,rdkit_bcut2d_mwhi,rdkit_bcut2d_mwlow,rdkit_bcut2d_chghi,rdkit_bcut2d_chglo,rdkit_bcut2d_logphi,rdkit_bcut2d_logplow,rdkit_bcut2d_mrhi,rdkit_bcut2d_mrlow,rdkit_avgipc,rdkit_balabanj,rdkit_bertzct,rdkit_chi0,rdkit_chi0n,rdkit_chi0v,rdkit_chi1,rdkit_chi1n,rdkit_chi1v,rdkit_chi2n,rdkit_chi2v,rdkit_chi3n,rdkit_chi3v,rdkit_chi4n,rdkit_chi4v,rdkit_hallkieralpha,rdkit_ipc,rdkit_kappa1,rdkit_kappa2,rdkit_kappa3,rdkit_labuteasa,rdkit_peoe_vsa1,rdkit_peoe_vsa10,rdkit_peoe_vsa11,rdkit_peoe_vsa12,rdkit_peoe_vsa13,rdkit_peoe_vsa14,rdkit_peoe_vsa2,rdkit_peoe_vsa3,rdkit_peoe_vsa4,rdkit_peoe_vsa5,rdkit_peoe_vsa6,rdkit_peoe_vsa7,rdkit_peoe_vsa8,rdkit_peoe_vsa9,rdkit_smr_vsa1,rdkit_smr_vsa10,rdkit_smr_vsa2,rdkit_smr_vsa3,rdkit_smr_vsa4,rdkit_smr_vsa5,rdkit_smr_vsa6,rdkit_smr_vsa7,rdkit_smr_vsa8,rdkit_smr_vsa9,rdkit_slogp_vsa1,rdkit_slogp_vsa10,rdkit_slogp_vsa11,rdkit_slogp_vsa12,rdkit_slogp_vsa2,rdkit_slogp_vsa3,rdkit_slogp_vsa4,rdkit_slogp_vsa5,rdkit_slogp_vsa6,rdkit_slogp_vsa7,rdkit_slogp_vsa8,rdkit_slogp_vsa9,rdkit_tpsa,rdkit_estate_vsa1,rdkit_estate_vsa10,rdkit_estate_vsa11,rdkit_estate_vsa2,rdkit_estate_vsa3,rdkit_estate_vsa4,rdkit_estate_vsa5,rdkit_estate_vsa6,rdkit_estate_vsa7,rdkit_estate_vsa8,rdkit_estate_vsa9,rdkit_vsa_estate1,rdkit_vsa_estate10,rdkit_vsa_estate2,rdkit_vsa_estate3,rdkit_vsa_estate4,rdkit_vsa_estate5,rdkit_vsa_estate6,rdkit_vsa_estate7,rdkit_vsa_estate8,rdkit_vsa_estate9,rdkit_fractioncsp3,rdkit_heavyatomcount,rdkit_nhohcount,rdkit_nocount,rdkit_numaliphaticcarbocycles,rdkit_numaliphaticheterocycles,rdkit_numaliphaticrings,rdkit_numamidebonds,rdkit_numaromaticcarbocycles,rdkit_numaromaticheterocycles,rdkit_numaromaticrings,rdkit_numatomstereocenters,rdkit_numbridgeheadatoms,rdkit_numhacceptors,rdkit_numhdonors,rdkit_numheteroatoms,rdkit_numheterocycles,rdkit_numrotatablebonds,rdkit_numsaturatedcarbocycles,rdkit_numsaturatedheterocycles,rdkit_numsaturatedrings,rdkit_numspiroatoms,rdkit_numunspecifiedatomstereocenters,rdkit_phi,rdkit_ringcount,rdkit_mollogp,rdkit_molmr,rdkit_fr_al_coo,rdkit_fr_al_oh,rdkit_fr_al_oh_notert,rdkit_fr_arn,rdkit_fr_ar_coo,rdkit_fr_ar_n,rdkit_fr_ar_nh,rdkit_fr_ar_oh,rdkit_fr_coo,rdkit_fr_coo2,rdkit_fr_c_o,rdkit_fr_c_o_nocoo,rdkit_fr_c_s,rdkit_fr_hoccn,rdkit_fr_imine,rdkit_fr_nh0,rdkit_fr_nh1,rdkit_fr_nh2,rdkit_fr_n_o,rdkit_fr_ndealkylation1,rdkit_fr_ndealkylation2,rdkit_fr_nhpyrrole,rdkit_fr_sh,rdkit_fr_aldehyde,rdkit_fr_alkyl_carbamate,rdkit_fr_alkyl_halide,rdkit_fr_allylic_oxid,rdkit_fr_amide,rdkit_fr_amidine,rdkit_fr_aniline,rdkit_fr_aryl_methyl,rdkit_fr_azide,rdkit_fr_azo,rdkit_fr_barbitur,rdkit_fr_benzene,rdkit_fr_benzodiazepine,rdkit_fr_bicyclic,rdkit_fr_diazo,rdkit_fr_dihydropyridine,rdkit_fr_epoxide,rdkit_fr_ester,rdkit_fr_ether,rdkit_fr_furan,rdkit_fr_guanido,rdkit_fr_halogen,rdkit_fr_hdrzine,rdkit_fr_hdrzone,rdkit_fr_imidazole,rdkit_fr_imide,rdkit_fr_isocyan,rdkit_fr_isothiocyan,rdkit_fr_ketone,rdkit_fr_ketone_topliss,rdkit_fr_lactam,rdkit_fr_lactone,rdkit_fr_methoxy,rdkit_fr_morpholine,rdkit_fr_nitrile,rdkit_fr_nitro,rdkit_fr_nitro_arom,rdkit_fr_nitro_arom_nonortho,rdkit_fr_nitroso,rdkit_fr_oxazole,rdkit_fr_oxime,rdkit_fr_para_hydroxylation,rdkit_fr_phenol,rdkit_fr_phenol_noorthohbond,rdkit_fr_phos_acid,rdkit_fr_phos_ester,rdkit_fr_piperdine,rdkit_fr_piperzine,rdkit_fr_priamide,rdkit_fr_prisulfonamd,rdkit_fr_pyridine,rdkit_fr_quatn,rdkit_fr_sulfide,rdkit_fr_sulfonamd,rdkit_fr_sulfone,rdkit_fr_term_acetylene,rdkit_fr_tetrazole,rdkit_fr_thiazole,rdkit_fr_thiocyan,rdkit_fr_thiophene,rdkit_fr_unbrch_alkane,rdkit_fr_urea
0,CC(=O)OCC(=O)[C@H]1CC[C@H]2[C@@H]3CCC4=CC(=O)C...,CHEMBL1200542,CC(=O)OCC(=O)[C@H]1CC[C@H]2[C@@H]3CCC4=CC(=O)C...,674493,DESOXYCORTICOSTERONE ACETATE,4.0,1,1,MOL,34671.0,Small molecule,1939.0,0,1,0,0,1,0,1,0,0,,0.0,-cort-; -ster-; -terone,0,-cort-; -ster-; -terone,"cortisone derivatives; steroids (androgens, an...",Adrenocortical Steroid (salt-regulating),0,0,0,372.51,4.27,4.0,0.0,60.44,3.0,N,0.0,,,3.77,3.77,NEUTRAL,372.51,0.0,27.0,0.69,372.2301,C23H32O4,4.0,0.0,0.0,1.96,12.773246,12.773246,0.028221,-0.376735,0.694387,43.222222,372.505,340.249,372.23006,148.0,0.0,0.302564,-0.45786,0.45786,0.302564,1.074074,1.851852,2.592593,16.534689,9.46484,2.595559,-2.576012,2.661677,-2.509003,5.913122,-0.148809,2.972962,1.555075,707.166909,19.396977,16.883706,16.883706,12.753691,10.654649,10.654649,9.889871,9.889871,8.768376,8.768376,7.361606,7.361606,-1.45,1338475.0,18.892162,6.562307,2.905355,161.653161,4.736863,6.606882,11.56649,0.0,0.0,5.969305,14.383612,0.0,0.0,0.0,19.420579,79.605471,19.262465,0.0,19.120475,17.535795,0.0,0.0,34.501605,72.137785,6.606882,11.649125,0.0,0.0,0.0,0.0,0.0,0.0,24.142677,19.120475,34.501605,72.137785,11.649125,0.0,0.0,0.0,60.44,0.0,14.383612,0.0,35.107319,29.957785,44.945751,12.496842,0.0,6.07602,13.847474,4.736863,5.016332,0.0,35.806943,0.0,1.613361,1.950787,0.0,10.110728,6.001849,0.0,0.782609,27.0,0.0,4.0,4.0,0.0,4.0,0.0,0.0,0.0,0.0,6.0,0.0,4.0,0.0,4.0,0.0,3.0,3.0,0.0,3.0,0.0,0.0,4.59171,4.0,4.2667,101.84,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,N=C(N)N,CHEMBL1200728,Cl.N=C(N)N,674679,GUANIDINE HYDROCHLORIDE,4.0,1,1,MOL,32735.0,Small molecule,1939.0,1,0,0,0,0,0,2,0,0,,1.0,guan-,0,guan-,antihypertensives (guanidine derivatives),,0,0,0,59.07,-1.16,1.0,3.0,75.89,0.0,N,0.0,,12.55,-1.24,-3.65,BASE,95.53,0.0,4.0,0.24,59.0483,CH6ClN3,3.0,5.0,0.0,0.32,6.055556,6.055556,0.333333,-0.333333,0.242956,,59.072,54.032,59.048347,24.0,0.0,0.182528,-0.370334,0.370334,0.182528,,,,14.880242,11.13969,1.520757,-1.686834,1.131063,-2.19535,5.713256,1.386203,0.811278,2.803039,26.264663,3.57735,2.154701,2.154701,1.732051,0.82735,0.82735,0.455342,0.455342,0.0,0.0,0.0,0.0,-0.73,3.245112,3.27,0.710529,0.173734,24.104383,11.467335,0.0,5.959555,0.0,0.0,0.0,5.409284,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.959555,5.409284,0.0,11.467335,0.0,0.0,0.0,0.0,0.0,11.467335,0.0,0.0,0.0,5.959555,0.0,5.409284,0.0,0.0,0.0,0.0,0.0,,0.0,0.0,0.0,5.959555,0.0,0.0,0.0,0.0,0.0,11.467335,5.409284,0.0,0.0,0.0,6.055556,8.944444,-0.333333,0.0,0.0,0.0,0.0,0.0,4.0,5.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,3.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.580857,0.0,-1.16143,16.1015,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,CCC(C)C1(CC)C(=O)NC(=O)NC1=O,CHEMBL1200982,CCC(C)C1(CC)C(=O)[N-]C(=O)NC1=O.[Na+],674933,BUTABARBITAL SODIUM,4.0,1,1,MOL,,Small molecule,1939.0,1,0,0,0,0,0,0,0,0,,1.0,-barb-,0,-barb-,barbituric acid derivatives,Sedative-Hypnotic,0,0,0,212.25,0.79,3.0,2.0,75.27,3.0,N,0.0,7.48,,1.45,1.19,NEUTRAL,234.23,0.0,15.0,0.68,212.1161,C10H15N2NaO3,5.0,2.0,0.0,0.32,11.775694,11.775694,0.087407,-1.094583,0.679143,,212.249,196.121,212.116092,84.0,0.0,0.327632,-0.276814,0.327632,0.276814,,,,16.197656,9.702763,2.51351,-2.368754,2.35253,-2.638437,6.188352,-0.148048,2.169489,3.105335,291.789362,11.637828,9.216309,9.216309,6.984435,5.154413,5.154413,3.871574,3.871574,3.2758,3.2758,2.029272,2.029272,-1.39,1757.286,11.683475,4.001507,1.619083,88.60219,0.0,5.41499,0.0,11.814359,0.0,6.031115,20.222652,4.794537,0.0,0.0,27.192033,12.338728,0.0,0.0,14.383612,17.845474,0.0,10.633577,11.332897,33.612855,0.0,0.0,0.0,0.0,10.633577,4.794537,0.0,0.0,17.845474,9.589074,11.332897,33.612855,0.0,0.0,0.0,0.0,,23.260464,14.383612,0.0,5.917906,12.841643,0.0,0.0,6.923737,13.847474,10.633577,0.0,0.0,0.0,34.486026,4.313889,-1.094583,-1.04463,-0.72465,1.106968,5.540314,0.0,0.7,15.0,2.0,5.0,0.0,0.0,0.0,,0.0,0.0,0.0,1.0,0.0,3.0,2.0,5.0,1.0,3.0,0.0,1.0,1.0,0.0,1.0,3.116767,1.0,0.7949,53.8604,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,3.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
3,NCCc1c[nH]cn1,CHEMBL3989520,NCCc1c[nH]cn1.O=P(O)(O)O.O=P(O)(O)O,2197391,HISTAMINE PHOSPHATE,4.0,1,1,MOL,,Small molecule,1939.0,0,1,0,1,0,0,2,0,0,,0.0,,0,,,,0,0,0,111.15,-0.09,2.0,2.0,54.7,2.0,Y,0.0,,9.58,-0.7,-2.85,BASE,307.14,1.0,8.0,0.56,111.0796,C5H15N3O8P2,3.0,3.0,0.0,0.0,5.265833,5.265833,0.671481,0.671481,0.560082,9.625,111.148,102.076,111.079647,44.0,0.0,0.092256,-0.350904,0.350904,0.092256,,,,14.853819,10.337599,1.874237,-1.845221,1.877082,-2.017761,4.933367,0.934888,2.185861,2.500249,133.393828,5.819991,4.593478,4.593478,3.931852,2.609633,2.609633,1.599216,1.599216,0.955332,0.955332,0.57551,0.57551,-0.83,107.1072,5.30947,2.470712,1.069114,47.929986,10.717646,0.0,0.0,0.0,0.0,0.0,0.0,4.983979,0.0,0.0,0.0,6.544756,12.617665,12.021248,0.0,0.0,0.0,9.967957,5.733667,6.420822,6.544756,18.218092,0.0,0.0,5.733667,0.0,0.0,0.0,16.512713,6.420822,0.0,5.693928,12.524164,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,6.544756,12.11475,0.0,6.32732,6.196844,9.967957,5.733667,0.0,0.0,6.818287,0.0,6.300556,0.0,0.0,4.376343,0.671481,0.0,0.4,8.0,3.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,2.0,3.0,1.0,2.0,0.0,0.0,0.0,0.0,0.0,1.639771,1.0,-0.0891,31.3461,0.0,0.0,0.0,0.0,0.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,CCC(C)C1(CC)C(=O)NC(=O)NC1=O,CHEMBL449,CCC(C)C1(CC)C(=O)NC(=O)NC1=O,2393,BUTABARBITAL,4.0,1,0,MOL,3228.0,Small molecule,1939.0,1,0,0,0,1,0,0,0,0,,1.0,-barb-,0,-barb-,barbituric acid derivatives,Sedative-Hypnotic,0,0,0,212.25,0.79,3.0,2.0,75.27,3.0,N,0.0,7.48,,1.45,1.19,NEUTRAL,212.25,0.0,15.0,0.68,212.1161,C10H16N2O3,5.0,2.0,0.0,0.32,11.775694,11.775694,0.087407,-1.094583,0.679143,21.933333,212.249,196.121,212.116092,84.0,0.0,0.327632,-0.276814,0.327632,0.276814,1.133333,1.6,1.933333,16.197656,9.702763,2.51351,-2.368754,2.35253,-2.638437,6.188352,-0.148048,2.169489,3.105335,291.789362,11.637828,9.216309,9.216309,6.984435,5.154413,5.154413,3.871574,3.871574,3.2758,3.2758,2.029272,2.029272,-1.39,1757.286,11.683475,4.001507,1.619083,88.60219,0.0,5.41499,0.0,11.814359,0.0,6.031115,20.222652,4.794537,0.0,0.0,27.192033,12.338728,0.0,0.0,14.383612,17.845474,0.0,10.633577,11.332897,33.612855,0.0,0.0,0.0,0.0,10.633577,4.794537,0.0,0.0,17.845474,9.589074,11.332897,33.612855,0.0,0.0,0.0,0.0,75.27,23.260464,14.383612,0.0,5.917906,12.841643,0.0,0.0,6.923737,13.847474,10.633577,0.0,0.0,0.0,34.486026,4.313889,-1.094583,-1.04463,-0.72465,1.106968,5.540314,0.0,0.7,15.0,2.0,5.0,0.0,1.0,1.0,4.0,0.0,0.0,0.0,1.0,0.0,3.0,2.0,5.0,1.0,3.0,0.0,1.0,1.0,0.0,1.0,3.116767,1.0,0.7949,53.8604,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,3.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0
