-
Notifications
You must be signed in to change notification settings - Fork 0
/
Covid 19 Portfolio Project - Data Exploration.sql
131 lines (112 loc) · 4.98 KB
/
Covid 19 Portfolio Project - Data Exploration.sql
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
/*
Covid 19 Data Exploration
Skills used: Joins, CTE's, Temp Tables, Windows Functions, Aggregate Functions, Creating Views, Converting Data Types
*/
-- Preview every column of the deaths table for rows that carry a continent value.
-- The table is database-qualified so this query reads the same object as every
-- other query in this script, regardless of the session's current database.
-- Sorted by the 3rd and 4th columns of the table
-- (presumably location and date -- confirm against the table definition).
SELECT *
FROM PorfolioProject..CovidDeaths
WHERE continent IS NOT NULL
ORDER BY 3, 4;
-- Case, death and population figures for every row, sorted by location and then date.
SELECT
    cd.location,
    cd.date,
    cd.total_cases,
    cd.new_cases,
    cd.total_deaths,
    cd.population
FROM PorfolioProject..CovidDeaths AS cd
ORDER BY
    cd.location,
    cd.date;
-- Total cases vs. total deaths.
-- DeathPercentage expresses total_deaths as a percentage of total_cases for each
-- row, restricted to locations whose name contains "states".
SELECT
    cd.location,
    cd.date,
    cd.total_cases,
    cd.total_deaths,
    (cd.total_deaths / cd.total_cases) * 100 AS DeathPercentage
FROM PorfolioProject..CovidDeaths AS cd
WHERE cd.location LIKE '%states%'
ORDER BY
    cd.location,
    cd.date;
-- Total cases vs. population.
-- PercentPopulationInfected expresses total_cases as a percentage of population
-- for each row, restricted to locations whose name contains "Kenya".
SELECT
    cd.location,
    cd.date,
    cd.total_cases,
    cd.population,
    (cd.total_cases / cd.population) * 100 AS PercentPopulationInfected
FROM PorfolioProject..CovidDeaths AS cd
WHERE cd.location LIKE '%Kenya%'
ORDER BY
    cd.location,
    cd.date;
-- Locations ranked by their peak infection rate relative to population.
-- For each (location, population) group: the largest total_cases value and the
-- largest total_cases / population ratio, the latter expressed as a percentage.
SELECT
    cd.location,
    MAX(cd.total_cases) AS HighestInfectionCount,
    MAX(cd.total_cases / cd.population) * 100 AS PercentPopulationInfected
FROM PorfolioProject..CovidDeaths AS cd
GROUP BY
    cd.location,
    cd.population
ORDER BY PercentPopulationInfected DESC;
-- Locations ranked by their highest recorded death count.
-- total_deaths is cast to INT before MAX so values compare numerically
-- (presumably the column is stored as text -- confirm against the table definition).
-- Only rows that carry a continent value are considered.
SELECT
    cd.location,
    MAX(CAST(cd.total_deaths AS INT)) AS TotalDeathCount
FROM PorfolioProject..CovidDeaths AS cd
WHERE cd.continent IS NOT NULL
GROUP BY cd.location
ORDER BY TotalDeathCount DESC;
-- Let's break things down by continent
-- Continents ranked by total death count.
-- Step 1 (inner query): each location's highest total_deaths value, i.e. that
--   location's death total (assumes total_deaths is a running total per
--   location -- confirm against the data).
-- Step 2 (outer query): add those per-location totals up within each continent.
-- Taking MAX(total_deaths) directly per continent would return only the figure
-- of the continent's single largest location, not the continent's total.
SELECT
    per_location.continent,
    SUM(per_location.LocationDeathCount) AS TotalDeathCount
FROM (
    SELECT
        continent,
        location,
        MAX(CAST(total_deaths AS INT)) AS LocationDeathCount
    FROM PorfolioProject..CovidDeaths
    WHERE continent IS NOT NULL
    GROUP BY
        continent,
        location
) AS per_location
GROUP BY per_location.continent
ORDER BY TotalDeathCount DESC;
-- Global numbers: one summary row over every row that carries a continent value.
--   total_cases     = sum of new_cases
--   total_deaths    = sum of new_deaths (cast to INT before summing)
--   DeathPercentage = total_deaths as a percentage of total_cases
-- The aggregate has no GROUP BY, so it yields a single row and the ORDER BY
-- has no visible effect.
SELECT
    SUM(cd.new_cases) AS total_cases,
    SUM(CAST(cd.new_deaths AS INT)) AS total_deaths,
    SUM(CAST(cd.new_deaths AS INT)) / SUM(cd.new_cases) * 100 AS DeathPercentage
FROM PorfolioProject..CovidDeaths AS cd
WHERE cd.continent IS NOT NULL
ORDER BY 1, 2;
-- Global numbers per date, over every row that carries a continent value.
--   total_cases     = sum of new_cases on that date
--   total_deaths    = sum of new_deaths on that date (cast to INT before summing)
--   DeathPercentage = total_deaths as a percentage of total_cases
-- NULLIF turns a zero case total into NULL, so a date with no new cases yields
-- a NULL percentage instead of aborting the query with a divide-by-zero error.
-- NOTE(review): if new_cases is an integer column the division is integer
-- division -- confirm the column type.
SELECT
    date,
    SUM(new_cases) AS total_cases,
    SUM(CAST(new_deaths AS INT)) AS total_deaths,
    SUM(CAST(new_deaths AS INT)) / NULLIF(SUM(new_cases), 0) * 100 AS DeathPercentage
FROM PorfolioProject..CovidDeaths
WHERE continent IS NOT NULL
GROUP BY date
ORDER BY date;  -- date is unique per group, so no secondary sort key is needed
-- Looking at Total Population vs Vaccinations
-- Joins deaths and vaccinations rows on (location, date) and adds
-- RollingPeopleVaccinated: a running total of new_vaccinations within each
-- location, accumulated in date order.
-- The running total is computed as BIGINT: an INT accumulator raises an
-- arithmetic overflow error once a location's total passes 2,147,483,647.
-- Within a partition location is constant, so the window is ordered by date only.
SELECT
    deaths.continent,
    deaths.location,
    deaths.date,
    deaths.population,
    vaccinations.new_vaccinations,
    SUM(CAST(vaccinations.new_vaccinations AS BIGINT)) OVER (
        PARTITION BY deaths.location
        ORDER BY deaths.date
    ) AS RollingPeopleVaccinated
FROM PorfolioProject..CovidDeaths AS deaths
INNER JOIN PorfolioProject..CovidVaccinations AS vaccinations
    ON deaths.location = vaccinations.location
    AND deaths.date = vaccinations.date
WHERE deaths.continent IS NOT NULL
ORDER BY
    deaths.location,
    deaths.date;
-- Create a CTE
-- PopVsVac holds, per (location, date) row with a continent value, the
-- population, new_vaccinations and a running total of new_vaccinations per
-- location in date order. The outer query adds VaccinatedPercentage: the
-- running total as a percentage of population.
-- The leading semicolon terminates whatever statement precedes this one; T-SQL
-- rejects WITH when the previous statement in the batch is unterminated.
-- The running total is BIGINT so it cannot overflow INT's 2,147,483,647 ceiling.
-- NOTE(review): if population is an integer column the percentage is computed
-- with integer division -- confirm the column type.
;WITH PopVsVac (continent, location, date, population, new_vaccinations, RollingPeopleVaccinated)
AS
(
    SELECT
        deaths.continent,
        deaths.location,
        deaths.date,
        deaths.population,
        vaccinations.new_vaccinations,
        SUM(CAST(vaccinations.new_vaccinations AS BIGINT)) OVER (
            PARTITION BY deaths.location
            ORDER BY deaths.date
        ) AS RollingPeopleVaccinated
    FROM PorfolioProject..CovidDeaths AS deaths
    INNER JOIN PorfolioProject..CovidVaccinations AS vaccinations
        ON deaths.location = vaccinations.location
        AND deaths.date = vaccinations.date
    WHERE deaths.continent IS NOT NULL
)
SELECT
    *,
    (RollingPeopleVaccinated / population) * 100 AS VaccinatedPercentage
FROM PopVsVac;
-- Create Temp table
-- Rebuilds #PercentPopVaccinated from scratch (dropped first so the script can
-- be re-run in the same session), fills it with the joined deaths/vaccinations
-- rows plus a per-location running total of new_vaccinations, then reports that
-- running total as a percentage of population.
-- No continent filter is applied here, so rows with a NULL continent are
-- included as well.
DROP TABLE IF EXISTS #PercentPopVaccinated;

CREATE TABLE #PercentPopVaccinated
(
    Continent nvarchar(255),
    Location nvarchar(255),
    Date Datetime,
    Population numeric,
    New_vaccinations numeric,
    RollingPeopleVaccinated bigint
);

-- Explicit column list: the insert no longer depends on the temp table's
-- column order matching the SELECT list by position.
INSERT INTO #PercentPopVaccinated
(
    Continent,
    Location,
    Date,
    Population,
    New_vaccinations,
    RollingPeopleVaccinated
)
SELECT
    deaths.continent,
    deaths.location,
    deaths.date,
    deaths.population,
    vaccinations.new_vaccinations,
    SUM(CAST(vaccinations.new_vaccinations AS BIGINT)) OVER (
        PARTITION BY deaths.location
        ORDER BY deaths.location, deaths.date
    ) AS RollingPeopleVaccinated
FROM PorfolioProject..CovidDeaths AS deaths
INNER JOIN PorfolioProject..CovidVaccinations AS vaccinations
    ON deaths.location = vaccinations.location
    AND deaths.date = vaccinations.date;

SELECT
    Continent,
    Location,
    Date,
    Population,
    New_vaccinations,
    RollingPeopleVaccinated,
    (RollingPeopleVaccinated / Population) * 100 AS VaccinatedPercentage
FROM #PercentPopVaccinated;
-- Creating view to store data for later visualizations
-- PercentPopulationVaccinated exposes, per (location, date) row with a
-- continent value, the population, new_vaccinations and a per-location running
-- total of new_vaccinations in date order.
-- The view is dropped first so the script can be re-run.
-- GO is the batch separator understood by SSMS / sqlcmd (it is not T-SQL):
-- CREATE VIEW must be the only statement in its batch, so it is fenced off
-- from the statements before and after it.
DROP VIEW IF EXISTS PercentPopulationVaccinated;
GO

CREATE VIEW PercentPopulationVaccinated
AS
SELECT
    deaths.continent,
    deaths.location,
    deaths.date,
    deaths.population,
    vaccinations.new_vaccinations,
    SUM(CAST(vaccinations.new_vaccinations AS BIGINT)) OVER (
        PARTITION BY deaths.location
        ORDER BY deaths.location, deaths.date
    ) AS RollingPeopleVaccinated
FROM PorfolioProject..CovidDeaths AS deaths
INNER JOIN PorfolioProject..CovidVaccinations AS vaccinations
    ON deaths.location = vaccinations.location
    AND deaths.date = vaccinations.date
WHERE deaths.continent IS NOT NULL;
GO

-- Read the view back to check its contents.
SELECT
    continent,
    location,
    date,
    population,
    new_vaccinations,
    RollingPeopleVaccinated
FROM PercentPopulationVaccinated;