In [1]:
import pandas as pd
import numpy as np
from additional_functions import *
import matplotlib.pyplot as plt
import plotly.express as px
import plotly.graph_objs as go


## READING DATA AND FIRST QUCIK TRANSFORMATIONS

In [135]:
internet_percentage = pd.read_csv('./data/internet_data.csv')
gdp_per_capita = pd.read_csv('./data/gdp_per_capita.csv')
fixed_broadband_subscription = pd.read_csv('./data/fixed_broadband_subscription.csv')
phone_per_citizen = pd.read_csv("./data/cellular_per_citizen.csv")

In [137]:
gdp_per_capita.drop(["Unnamed: 65", "Country Code", "Indicator Code", "Indicator Name"], axis=1, inplace=True)
fixed_broadband_subscription.drop(["Unnamed: 65", "Country Code", "Indicator Code", "Indicator Name"], axis=1, inplace=True)
internet_percentage.drop(["Country Code", "Indicator Code", "Indicator Name"], axis=1, inplace=True)
phone_per_citizen.drop(["Country Code", "Indicator Code", "Indicator Name"], axis=1, inplace=True)


In [138]:
gdp_per_capita.set_index(keys=["Country Name"], inplace=True)
fixed_broadband_subscription.set_index(keys=["Country Name"], inplace=True)
internet_percentage.set_index(keys=["Country Name"], inplace=True)
phone_per_citizen.set_index(keys=["Country Name"], inplace=True)


### CONVERTING ALL DATA INTO ONE FRAME FOR EASIER DATA VISUALIZATION

In [140]:
big_one = pd.DataFrame(columns=["Country", "GDP per capita", "Cellular per citizen", "Internet", "Broadband", "Year"])
columns = gdp_per_capita.columns[1:]
for column in columns:
    gdp = gdp_per_capita.loc[:,column]
    cellular = phone_per_citizen.loc[:,column]
    internet = internet_percentage.loc[:,column]
    broadband = fixed_broadband_subscription.loc[:,column]
    X = pd.concat([gdp, cellular, internet, broadband], axis=1)
    X.reset_index(inplace=True)
    X.loc[:,"Year"] = int(column)
    X.set_axis(['Country', 'GDP per capita', 'Cellular per citizen', 'Internet', 'Broadband', 'Year'], axis="columns", inplace=True)
    big_one = pd.concat([big_one, X], axis=0)
    big_one.reset_index(drop=True, inplace=True)

big_one.to_csv('./data/transformed.csv')

### READING DATA AND FURTHER TRANS AND VISUO

In [2]:
transformed = pd.read_csv('./data/transformed.csv')
transformed = transformed.loc[transformed['Year'] >= 2000,]
transformed.drop(['Unnamed: 0'], axis=1, inplace=True)
transformed.reset_index(drop=True, inplace=True)
transformed

Unnamed: 0,Country,GDP per capita,Cellular per citizen,Internet,Broadband,Year
0,Aruba,20617.750467,16.510187,15.442823,,2000
1,Africa Eastern and Southern,713.245921,2.515358,0.743922,,2000
2,Afghanistan,,0.000000,,,2000
3,Africa Western and Central,525.450343,0.535656,0.138961,,2000
4,Angola,556.838632,0.157397,0.105046,,2000
...,...,...,...,...,...,...
5581,Kosovo,4346.637931,,,,2020
5582,"Yemen, Rep.",,,,,2020
5583,South Africa,5655.867654,161.796592,,2.197076,2020
5584,Zambia,985.132436,103.917835,,0.447765,2020


In [3]:
transformed = transformed.loc[transformed['Country'].isin(['Albania', 'Poland', 'Germany', 'France', 'China']), :]

In [7]:
fig = px.line(data_frame=transformed, x="Year", y="Internet", color='Country', markers=True)
fig.show()

In [131]:
fig = px.line(data_frame=transformed, x="Year", y="Internet", color='Country', marker)
fig.show()

In [6]:
from dash import Dash, dcc, html, Input, Output
import plotly.express as px

app = Dash(__name__)


app.layout = html.Div([
    html.H4('Life expentancy progression of countries per continents'),
    dcc.Graph(id="graph"),
    dcc.Checklist(
        id="checklist",
        options=["Asia", "Europe", "Africa","Americas","Oceania"],
        value=["Americas", "Oceania"],
        inline=True
    ),
])


@app.callback(
    Output("graph", "figure"),
    Input("checklist", "value"))
def update_line_chart(continents):
    df = px.data.gapminder() # replace with your own data source
    mask = df.continent.isin(continents)
    fig = px.line(df[mask],
        x="year", y="lifeExp", color='country')
    return fig


app.run_server(debug=True)

ImportError: cannot import name 'dcc' from 'dash' (C:\Users\micha\programmes\anaconda3\lib\site-packages\dash\__init__.py)

In [41]:
fig = px.line(x=gdp_per_capita["Country Name"], y=gdp_per_capita["2010"])
fig.show()

In [43]:
gdp_per_capita.set_index(keys="Country Name", inplace=True)

In [51]:
australia = gdp_per_capita.loc["Australia", :]
australia = australia.iloc[3:]

In [52]:
australia

1960      1810.61923
1961     1877.616638
1962     1854.656834
1963     1967.116537
1964     2131.377948
            ...     
2016    49881.763714
2017    53934.250175
2018      57180.7794
2019    54875.285956
2020    51692.842748
Name: Australia, Length: 61, dtype: object

In [55]:
fig = px.line(x=australia.index, y = australia)
fig.show()

In [58]:
print(fig)

Figure({
    'data': [{'hovertemplate': 'x=%{x}<br>y=%{y}<extra></extra>',
              'legendgroup': '',
              'line': {'color': '#636efa', 'dash': 'solid'},
              'marker': {'symbol': 'circle'},
              'mode': 'lines',
              'name': '',
              'orientation': 'v',
              'showlegend': False,
              'type': 'scatter',
              'x': array(['1960', '1961', '1962', '1963', '1964', '1965', '1966', '1967', '1968',
                          '1969', '1970', '1971', '1972', '1973', '1974', '1975', '1976', '1977',
                          '1978', '1979', '1980', '1981', '1982', '1983', '1984', '1985', '1986',
                          '1987', '1988', '1989', '1990', '1991', '1992', '1993', '1994', '1995',
                          '1996', '1997', '1998', '1999', '2000', '2001', '2002', '2003', '2004',
                          '2005', '2006', '2007', '2008', '2009', '2010', '2011', '2012', '2013',
                          '2014', '201

In [69]:
fig.layout.margin.t = 60

In [70]:
fig.show()

In [71]:
fig.frames

()

In [77]:
fig.layout.width = None
fig.show()

In [78]:
df = px.data.gapminder()
df

Unnamed: 0,country,continent,year,lifeExp,pop,gdpPercap,iso_alpha,iso_num
0,Afghanistan,Asia,1952,28.801,8425333,779.445314,AFG,4
1,Afghanistan,Asia,1957,30.332,9240934,820.853030,AFG,4
2,Afghanistan,Asia,1962,31.997,10267083,853.100710,AFG,4
3,Afghanistan,Asia,1967,34.020,11537966,836.197138,AFG,4
4,Afghanistan,Asia,1972,36.088,13079460,739.981106,AFG,4
...,...,...,...,...,...,...,...,...
1699,Zimbabwe,Africa,1987,62.351,9216418,706.157306,ZWE,716
1700,Zimbabwe,Africa,1992,60.377,10704340,693.420786,ZWE,716
1701,Zimbabwe,Africa,1997,46.809,11404948,792.449960,ZWE,716
1702,Zimbabwe,Africa,2002,39.989,11926563,672.038623,ZWE,716


In [81]:
gdp_per_capita = gdp_per_capita.iloc[:,3:]

In [82]:
gdp_per_capita

Unnamed: 0_level_0,1960,1961,1962,1963,1964,1965,1966,1967,1968,1969,...,2011,2012,2013,2014,2015,2016,2017,2018,2019,2020
Country Name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Aruba,,,,,,,,,,,...,24985.013919,24712.493263,26441.619936,26893.011506,28396.908423,28452.170615,29350.805019,30253.279358,,
Africa Eastern and Southern,147.612227,147.014904,156.189192,182.243917,162.347592,180.214908,190.845484,192.337167,204.007099,227.908615,...,1770.736230,1736.166560,1713.899299,1703.596298,1549.037940,1431.778723,1573.063386,1574.978648,1530.059177,1359.618224
Afghanistan,59.773234,59.860900,58.458009,78.706429,82.095307,101.108325,137.594298,160.898434,129.108311,129.329760,...,591.190030,638.845852,624.315455,614.223342,556.007221,512.012778,516.679862,485.668419,494.179350,516.747871
Africa Western and Central,107.932233,113.081647,118.831107,123.442888,131.854402,138.526332,144.326212,128.582470,129.641106,143.715632,...,1862.308267,1965.118485,2157.481149,2212.853135,1894.310195,1673.835527,1613.473553,1704.139603,1777.918672,1710.073363
Angola,,,,,,,,,,,...,4615.468219,5100.097027,5254.881126,5408.411700,4166.979833,3506.073128,4095.810057,3289.643995,2809.626088,1776.166868
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Kosovo,,,,,,,,,,,...,3540.891789,3410.859780,3704.784221,3902.676013,3520.766449,3759.560246,4009.380987,4384.048892,4416.108358,4346.637931
"Yemen, Rep.",,,,,,,,,,,...,1374.621401,1446.536472,1607.152173,1674.002572,1601.830063,1152.720966,964.264811,758.145242,,
South Africa,443.009920,454.962013,473.011405,511.497364,548.996058,584.704163,621.220543,675.135345,711.225742,780.625919,...,8810.930651,8222.197279,7467.079185,6988.808739,6259.839681,5756.965741,6690.939847,7005.095413,6624.761865,5655.867654
Zambia,232.188564,220.042067,212.578449,213.896759,242.384473,303.281740,343.373670,360.201239,409.775349,485.872618,...,1672.907535,1763.069442,1878.346811,1762.427817,1338.290927,1280.806543,1535.196574,1516.368371,1305.001031,985.132436


In [83]:
columns = gdp_per_capita.columns
big_one = pd.DataFrame(columns=["Country", "Year"])
for column in columns:
    X =

Index(['1960', '1961', '1962', '1963', '1964', '1965', '1966', '1967', '1968',
       '1969', '1970', '1971', '1972', '1973', '1974', '1975', '1976', '1977',
       '1978', '1979', '1980', '1981', '1982', '1983', '1984', '1985', '1986',
       '1987', '1988', '1989', '1990', '1991', '1992', '1993', '1994', '1995',
       '1996', '1997', '1998', '1999', '2000', '2001', '2002', '2003', '2004',
       '2005', '2006', '2007', '2008', '2009', '2010', '2011', '2012', '2013',
       '2014', '2015', '2016', '2017', '2018', '2019', '2020'],
      dtype='object')

In [95]:
gdp_per_capita

Unnamed: 0_level_0,1960,1961,1962,1963,1964,1965,1966,1967,1968,1969,...,2011,2012,2013,2014,2015,2016,2017,2018,2019,2020
Country Name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Aruba,,,,,,,,,,,...,24985.013919,24712.493263,26441.619936,26893.011506,28396.908423,28452.170615,29350.805019,30253.279358,,
Africa Eastern and Southern,147.612227,147.014904,156.189192,182.243917,162.347592,180.214908,190.845484,192.337167,204.007099,227.908615,...,1770.736230,1736.166560,1713.899299,1703.596298,1549.037940,1431.778723,1573.063386,1574.978648,1530.059177,1359.618224
Afghanistan,59.773234,59.860900,58.458009,78.706429,82.095307,101.108325,137.594298,160.898434,129.108311,129.329760,...,591.190030,638.845852,624.315455,614.223342,556.007221,512.012778,516.679862,485.668419,494.179350,516.747871
Africa Western and Central,107.932233,113.081647,118.831107,123.442888,131.854402,138.526332,144.326212,128.582470,129.641106,143.715632,...,1862.308267,1965.118485,2157.481149,2212.853135,1894.310195,1673.835527,1613.473553,1704.139603,1777.918672,1710.073363
Angola,,,,,,,,,,,...,4615.468219,5100.097027,5254.881126,5408.411700,4166.979833,3506.073128,4095.810057,3289.643995,2809.626088,1776.166868
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Kosovo,,,,,,,,,,,...,3540.891789,3410.859780,3704.784221,3902.676013,3520.766449,3759.560246,4009.380987,4384.048892,4416.108358,4346.637931
"Yemen, Rep.",,,,,,,,,,,...,1374.621401,1446.536472,1607.152173,1674.002572,1601.830063,1152.720966,964.264811,758.145242,,
South Africa,443.009920,454.962013,473.011405,511.497364,548.996058,584.704163,621.220543,675.135345,711.225742,780.625919,...,8810.930651,8222.197279,7467.079185,6988.808739,6259.839681,5756.965741,6690.939847,7005.095413,6624.761865,5655.867654
Zambia,232.188564,220.042067,212.578449,213.896759,242.384473,303.281740,343.373670,360.201239,409.775349,485.872618,...,1672.907535,1763.069442,1878.346811,1762.427817,1338.290927,1280.806543,1535.196574,1516.368371,1305.001031,985.132436


In [89]:
big_one = pd.DataFrame(columns=["Country", "Year", "Value"])
i = 0
for column in columns:
    X = gdp_per_capita.loc[:,column]


Unnamed: 0,Country,Year


In [93]:
big_one.loc[1] = ["alicja", 100]

In [94]:
big_one.append()

Unnamed: 0,Country,Year
1,alicja,100
