# Create dynamic table for Top 50 interactions for COAD

In [None]:
import ipywidgets as widgets
from ipywidgets import interact, interact_manual
import pandas as pd
import numpy as np

In [None]:
# Relative path to the input CSV; it is loaded with pd.read_csv in the next cell.
# NOTE(review): the path is relative, so it resolves against the kernel's working
# directory — presumably the notebook's own folder; confirm before running elsewhere.
database = "../db/dbCOAD-DRD.csv"

In [None]:
# Load the full interaction table from the CSV path configured above and show it
df = pd.read_csv(filepath_or_buffer=database)
df

In [None]:
# Select the top interactions by AE.
AE_CUTOFF = -8.5  # keep rows with AE <= this value (kcal/mol per the notebook text)
TOP_N = 50        # number of interactions to keep

# keep only interactions at or below the AE cutoff
df_repurposing = df[df['AE'] <= AE_CUTOFF]

# Order by AE ascending (most negative first) so that "top N" really is the
# N lowest AE values and does not silently depend on the row order of the CSV.
# mergesort is stable: rows with equal AE keep their original relative order,
# so an already-sorted input yields exactly the same rows as before.
df_repurposing = df_repurposing.sort_values('AE', kind='mergesort')

# get only the best TOP_N interactions
df_repurposing = df_repurposing.head(TOP_N)

# use other order of columns
df_repurposing = df_repurposing[['AE', 'HGNC_symbol', 'DrugName', 'ProteinID', 'DrugCID', 'Drug']]
df_repurposing

From 23,272 interactions (PDB–compound pairs), we selected only the 50 best interactions with AE ≤ -8.5 kcal/mol.

In [None]:
# Render the selected table as HTML markup (index column included) and print the raw markup
top50_html = df_repurposing.to_html()
print(top50_html)

In [None]:
# Save the table as an HTML file (index column omitted via index=False).
# The context manager guarantees the file is closed even if to_html() or
# write() raises, which the manual open()/close() pair did not.
with open("../extras/top50_table.html", "w") as fout:
    fout.write(df_repurposing.to_html(index=False))

In [None]:
# Report how many distinct values each identifier column holds in the selection.
# Each pair is (printed label, column name); distinct values are counted with a set.
count_targets = [
    ('No of genes:', 'HGNC_symbol'),
    ('No of PDBs:', 'ProteinID'),
    ('No of drug names:', 'DrugName'),
    ('No of drug compounds:', 'DrugCID'),
]
for label, column in count_targets:
    print(label, len(set(df_repurposing[column])))

In [None]:
# Write the selected interactions to a CSV file, leaving out the index column
df_repurposing.to_csv(path_or_buf="../db/dbCOAD-DRD_Top50.csv", index=False)