# Libraries

In [1]:
import pandas as pd

# Data

In [2]:
# Import data
# Read the CSV at ../data/data.csv (relative to the working directory) into a
# DataFrame. Later cells slice this frame by row position and pass it to
# find_arv_proportion.
data = pd.read_csv("../data/data.csv")

# Analyze

In [3]:
def find_arv_proportion(dataset, arv_name):
    """
    Function finds proportion of patients taking specified ARV.

    The denominator counts rows with hiv_status == 1 and on_arv == 1.
    The numerator counts rows with hiv_status == 1 and `arv_name` == 1.

    Input: dataset (dataframe with "patient_id", "hiv_status", "on_arv" and
           `arv_name` columns) and arv_name (str, name of the ARV column)
    Output: tuple of (arv_name, fraction as string "taking/total",
            percentage rounded to 3 decimals). The percentage is NaN when
            the denominator is zero, instead of raising ZeroDivisionError.
    """
    hiv_positive = dataset["hiv_status"] == 1

    # Denominator: HIV-positive rows flagged as being on any ARV.
    total = len(dataset[hiv_positive & (dataset["on_arv"] == 1)]["patient_id"])

    # Numerator: HIV-positive rows flagged for this specific ARV.
    # NOTE(review): unlike the denominator, this does not require on_arv == 1,
    # so the numerator is not guaranteed to be a subset of the denominator --
    # confirm that this is intended.
    taking_arv = len(dataset[hiv_positive & (dataset[arv_name] == 1)]["patient_id"])

    # An empty denominator (e.g. a slice with no HIV-positive patients on ARV)
    # has no defined percentage; report NaN rather than crashing.
    if total:
        percentage = round(taking_arv / total * 100, 3)
    else:
        percentage = float("nan")

    return (arv_name, "{}/{}".format(taking_arv, total), percentage)

In [None]:
# The final 181 rows of `data` make up the small dataset.
small_data = data[-181:]

# ARVs only in small data
# (the "azt" and "zidovudine" calls were commented out and stay excluded)
_small_data_arvs = (
    "abacavir",
    "lamivudine",
    "stavudine",
    "tdf",
    "gazt",
    "efavirenz",
    "nevirapine",
    "combivir",
    "atripla",
    "aluvia",
    "truvada",
)
for _arv in _small_data_arvs:
    print(find_arv_proportion(small_data, _arv))

In [None]:
# Everything except the final 181 rows of `data` makes up the large dataset.
large_data = data[:-181]

# ARVs in small data, computed only for large data patients
# (the "azt" and "zidovudine" calls were commented out here; zidovudine is
# reported with the large-data-only group below)
_shared_arvs = (
    "abacavir",
    "lamivudine",
    "stavudine",
    "tdf",
    "gazt",
    "efavirenz",
    "nevirapine",
    "combivir",
    "atripla",
    "aluvia",
    "truvada",
)
for _arv in _shared_arvs:
    print(find_arv_proportion(large_data, _arv))

# ARVs in large data only
_large_only_arvs = (
    "zalcitabine",
    "didanosine",
    "dolutegravir",
    "elvitegravir",
    "emtricitabine",
    "delavirdine",
    "etravirine",
    "rilpivirine",
    "tld",
    "amprenavir",
    "atazanavir",
    "atazanavir_boosted",
    "darunavir",
    "darunavir_boosted",
    "fosamprenavir",
    "fosamprenavir_boosted",
    "indinavir",
    "lopinavir",
    "lopinavir_boosted",
    "nelfinavir",
    "ritonavir",
    "saquinavir",
    "saquinavir_boosted",
    "tipranavir",
    "tipranavir_boosted",
    "maraviroc",
    "raltegravir",
    "enfuvirtide",
    "cobicistat",
    "zidovudine",
)
for _arv in _large_only_arvs:
    print(find_arv_proportion(large_data, _arv))

In [None]:
# ARVs for all HIV pos patients

# Columns are reported in this fixed order over the full `data` frame.
_all_patient_arvs = (
    "abacavir",
    "lamivudine",
    "stavudine",
    "tdf",
    "gazt",
    "zidovudine",
    "efavirenz",
    "nevirapine",
    "combivir",
    "atripla",
    "aluvia",
    "truvada",
    "tld",
)
for _arv in _all_patient_arvs:
    print(find_arv_proportion(data, _arv))

In [None]:
# These ARVs were not in our categorization tables due to questions
print(find_arv_proportion(data, "cobicistat"))

# enfuvirtide is computed from the separate large_data.csv file, not `data`.
large = pd.read_csv("../data/large_data.csv")
# Printed explicitly, like every other result in this file, so the value is
# shown even when this code runs outside a notebook cell.
print(find_arv_proportion(large, "enfuvirtide"))

In [None]:
# ARV groupings
# Each grouping is read from its own column of `data`.
for _group in ("nrti", "nnrti", "pi"):
    print(find_arv_proportion(data, _group))