# **SETUP & IMPORTS**

In [None]:
!pip install pycountry
!pip install kaggle

In [None]:
import os

# Data handling
import pandas as pd
import numpy as np
from sklearn.linear_model import LinearRegression


# Visualization
import matplotlib.pyplot as plt
import seaborn as sns

# Machine learning
from sklearn.preprocessing import StandardScaler
from sklearn.cluster import KMeans
from sklearn.decomposition import PCA, TruncatedSVD
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import classification_report, confusion_matrix
from sklearn.feature_extraction.text import TfidfVectorizer

# Association rules
from mlxtend.frequent_patterns import apriori, association_rules

# Time series
import statsmodels as sm



## **IMPORTING KAGGLE DATASET**

In [None]:
from google.colab import files
files.upload()   # upload kaggle.json here


!mkdir -p ~/.kaggle
!cp kaggle.json ~/.kaggle/
!chmod 600 ~/.kaggle/kaggle.json


!kaggle datasets download -d amohankumar/global-nutrition-adult-and-adolescent-dataset
!unzip global-nutrition-adult-and-adolescent-dataset.zip
country_dietary = pd.read_csv("Country Dietary Needs.csv")
country_dietary


## **IMPORTING WHO DATASET**

In [None]:
# Dataset label -> API endpoint URL for each indicator loaded further down.
# Built from an ordered sequence of (label, url) pairs; insertion order is
# preserved in the resulting dict.
DATA_LINKS = dict((
    ("adult_obesity_age_standardized", "https://ghoapi.azureedge.net/api/NCD_BMI_30C"),
    ("child_adolescent_obesity_crude", "https://ghoapi.azureedge.net/api/NCD_BMI_PLUS2C"),
    ("under5_overweight_prevalence", "https://ghoapi.azureedge.net/api/NUTRITION_ANT_WHZ_NE2"),
    ("under5_wasting_prevalence", "https://ghoapi.azureedge.net/api/NUTRITION_WH_2"),
    ("under5_stunting_prevalence", "https://ghoapi.azureedge.net/api/NUTRITION_ANT_HAZ_NE2"),
    ("sugar_availability_per_capita", "https://ghoapi.azureedge.net/api/ORALHEALTH_SUGAR_AVAILABILITY"),
))

In [None]:
def load_csv(path_or_url, nrows=None):
    """Read a JSON document and flatten its ``value`` records into a DataFrame.

    Despite the name (kept so existing calls keep working), the input is
    parsed as JSON, not CSV. The document must have a top-level ``value``
    entry holding a list of records; nested fields in each record are
    flattened by ``pd.json_normalize`` into dotted column names.

    Parameters
    ----------
    path_or_url : str
        Anything ``pd.read_json`` accepts as a source (local path or URL).
    nrows : int, optional
        If given, keep only the first ``nrows`` records. The whole document
        is still read and parsed; the limit is applied afterwards.

    Returns
    -------
    pandas.DataFrame
        One row per record in ``value``.

    Raises
    ------
    KeyError
        If the parsed document has no ``value`` entry.
    """
    # nrows is deliberately NOT forwarded to read_json: pandas only accepts it
    # together with lines=True and raises ValueError otherwise.
    payload = pd.read_json(path_or_url)
    records = payload['value']
    if nrows is not None:
        records = records.head(nrows)
    return pd.json_normalize(records)

In [None]:
# Fetch every indicator in a fixed order and bind each resulting DataFrame to
# the variable that shares its DATA_LINKS key.
(
    adult_obesity_age_standardized,
    child_adolescent_obesity_crude,
    under5_overweight_prevalence,
    under5_wasting_prevalence,
    under5_stunting_prevalence,
    sugar_availability_per_capita,
) = [
    load_csv(DATA_LINKS[dataset_key])
    for dataset_key in (
        'adult_obesity_age_standardized',
        'child_adolescent_obesity_crude',
        'under5_overweight_prevalence',
        'under5_wasting_prevalence',
        'under5_stunting_prevalence',
        'sugar_availability_per_capita',
    )
]