In [13]:
library(tidyverse)
library(tidyr)

In [14]:
# Load EGOV_DATA_2024.csv, keep only the country name and the
# Telecommunication Infrastructure Index column, and order rows by country.
egdi <- read.csv('EGOV_DATA_2024.csv')
egdi <- select(egdi, Country.Name, Telecommunication.Infrastructure.Index)
egdi <- arrange(egdi, Country.Name)

In [15]:
# Distinct country names found in egdi, in order of first appearance.
countries <- egdi$Country.Name[!duplicated(egdi$Country.Name)]

In [16]:
# Load pib_percapita_ppc.csv (presumably GDP per capita, PPP -- confirm against
# the data source) and keep the country name and the 2024 column, ordered by
# country.
#
# Missing 2024 values are deliberately left as NA rather than replaced by 0:
# a zero is a real-looking data point that would sit on the x axis of the
# scatter plot and drag the fitted regression line down. Keeping NA preserves
# the row count, and ggplot2 drops non-finite values (with a warning) when
# drawing points and fitting the smoother.
gdp <- read.csv('pib_percapita_ppc.csv') %>%
    select(Country.Name, X2024) %>%
    arrange(Country.Name)

In [17]:
# Sanity check: country names in egdi that have no identically spelled
# counterpart in gdp.
with(egdi, setdiff(Country.Name, gdp$Country.Name))

In [18]:
# Rewrite selected gdp country names to alternative spellings (intended to
# match the ones used in egdi), keep only the countries that egdi also lists,
# and sort by name. Wrapped in local() so the helper objects do not leak into
# the global environment.
# Assumes Country.Name is a character column (the read.csv default since
# R 4.0) -- the lookup below indexes by name.
gdp <- local({
    # Names are the spellings as they appear in gdp; values are replacements.
    spelling_map <- c(
        'Bahamas, The' = 'Bahamas',
        'Congo, Rep.' = 'Congo',
        'Czechia' = 'Czech Republic',
        'Cote d\'Ivoire' = 'Côte d\'Ivoire',
        'Egypt, Arab Rep.' = 'Egypt',
        'Gambia, The' = 'Gambia',
        'Georgia' = 'Georgia (Country)',
        'Micronesia, Fed. Sts.' = 'Micronesia (Federated States of)',
        'Turkiye' = 'Türkiye',
        'Iran, Islamic Rep.' = 'Iran (Islamic Republic of)',
        'Congo, Dem. Rep.' = 'Democratic Republic of the Congo',
        'Korea, Rep.' = 'Republic of Korea',
        'Moldova' = 'Republic of Moldova',
        'Korea, Dem. People\'s Rep.' = 'Democratic People\'s Republic of Korea',
        'Slovak Republic' = 'Slovakia',
        'St. Kitts and Nevis' = 'Saint Kitts and Nevis',
        'St. Lucia' = 'Saint Lucia',
        'St. Vincent and the Grenadines' = 'Saint Vincent and the Grenadines',
        'Yemen, Rep.' = 'Yemen',
        'Venezuela, RB' = 'Venezuela',
        'United Kingdom' = 'United Kingdom of Great Britain and Northern Ireland',
        'Tanzania' = 'United Republic of Tanzania',
        'United States' = 'United States of America',
        'Lao PDR' = 'Lao People\'s Democratic Republic',
        'Kyrgyz Republic' = 'Kyrgyzstan'
    )

    renamed <- mutate(
        gdp,
        # A name missing from the map indexes to NA, so coalesce() falls back
        # to the original spelling.
        Country.Name = coalesce(
            unname(spelling_map[Country.Name]),
            Country.Name
        )
    )
    shared <- filter(renamed, Country.Name %in% egdi$Country.Name)
    arrange(shared, Country.Name)
})

In [19]:
# Re-run the name check: any country printed here is in egdi but still has no
# matching row in gdp.
egdi$Country.Name %>% setdiff(gdp$Country.Name)

In [20]:
# Number of rows (one Country.Name entry each) currently held in gdp.
nrow(gdp)

In [21]:
# Build the plotting table with one row per country present in both sources.
#
# The two measures are paired by Country.Name instead of by row position, so
# the result stays correct even when egdi and gdp do not contain exactly the
# same countries in exactly the same order (positional pairing would either
# fail on differing row counts or silently mix up countries).
# Row order follows egdi; the resulting columns are `egdi` and `gdp`.
df <- egdi %>%
    inner_join(gdp, by = 'Country.Name') %>%
    transmute(
        egdi = Telecommunication.Infrastructure.Index,
        gdp = X2024
    )

In [22]:
# Scatter plot of df$gdp against df$egdi with a fitted linear-model trend
# line. coord_cartesian() restricts the visible x range to [0, 1] without
# discarding any data before the fit.
final_plot <- ggplot(data = df, mapping = aes(egdi, gdp)) +
    geom_point() +
    geom_smooth(method = 'lm') +
    coord_cartesian(xlim = c(0, 1)) +
    xlab('TCI') +
    ylab('PIB per capita PPC')

In [23]:
# Write the figure to disk as a 25.4 cm x 15.24 cm PNG at 300 dpi.
# The plot object is passed explicitly: without `plot =`, ggsave() saves
# whatever last_plot() happens to return, which may be a different figure if
# any other plot was created or modified in between.
# NOTE(review): the destination is an absolute, machine-specific path; it is
# kept unchanged here.
ggsave(
    'C:/Users/lazar/Master-Dissertation/figuras/relacao_tci_pib_percapita_ppc.png',
    plot = final_plot,
    dpi = 300,
    width = 25.4,
    height = 15.24,
    units = "cm"
)

[1m[22m`geom_smooth()` using formula = 'y ~ x'
