-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcovid19SQL.sql
More file actions
116 lines (101 loc) · 4.33 KB
/
covid19SQL.sql
File metadata and controls
116 lines (101 loc) · 4.33 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
/*
Covid 19 Data Exploration in MySQL
Skills used: Joins, CTEs, Temp Tables, Window Functions, Aggregate Functions, Creating Views, Converting Data Types
*/
-- Select all data from CovidDeaths table
SELECT *
FROM coviddata.coviddeaths
WHERE continent IS NOT NULL
ORDER BY 3,4;
-- Selecting necessary columns for initial data exploration
SELECT location, date, total_cases, new_cases, total_deaths, population
FROM coviddata.coviddeaths
WHERE continent IS NOT NULL
ORDER BY 1,2;
-- Total Cases vs Total Deaths (Likelihood of dying if infected)
SELECT location, date, total_cases, total_deaths,
(total_deaths / total_cases) * 100 AS DeathPercentage
FROM coviddata.coviddeaths
WHERE location LIKE '%states%'
AND continent IS NOT NULL
ORDER BY 1,2;
-- Total Cases vs Population (Percentage of population infected)
SELECT location, date, population, total_cases,
(total_cases / population) * 100 AS PercentPopulationInfected
FROM coviddata.coviddeaths
ORDER BY 1,2;
-- Countries with Highest Infection Rate compared to Population
SELECT location, population, MAX(total_cases) AS HighestInfectionCount,
MAX((total_cases / population) * 100) AS PercentPopulationInfected
FROM coviddata.coviddeaths
GROUP BY location, population
ORDER BY PercentPopulationInfected DESC;
-- Countries with Highest Death Count per Population
SELECT location, MAX(CAST(total_deaths AS UNSIGNED)) AS TotalDeathCount
FROM coviddata.coviddeaths
WHERE continent IS NOT NULL
GROUP BY location
ORDER BY TotalDeathCount DESC;
-- Breaking down by Continent - Highest death count per population
SELECT continent, MAX(CAST(total_deaths AS UNSIGNED)) AS TotalDeathCount
FROM coviddata.coviddeaths
WHERE continent IS NOT NULL
GROUP BY continent
ORDER BY TotalDeathCount DESC;
-- Global Numbers (Total Cases, Total Deaths, Death Percentage)
SELECT SUM(new_cases) AS total_cases,
SUM(CAST(new_deaths AS UNSIGNED)) AS total_deaths,
(SUM(CAST(new_deaths AS UNSIGNED)) / SUM(new_cases)) * 100 AS DeathPercentage
FROM coviddata.coviddeaths
WHERE continent IS NOT NULL
ORDER BY 1,2;
-- Total Population vs Vaccinations
-- Shows percentage of population that has received at least one vaccine dose
SELECT dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations,
SUM(vac.new_vaccinations) OVER (PARTITION BY dea.location ORDER BY dea.date) AS RollingPeopleVaccinated
FROM coviddata.coviddeaths dea
JOIN coviddata.covidvaccinations vac
ON dea.location = vac.location
AND dea.date = vac.date
WHERE dea.continent IS NOT NULL
ORDER BY 2,3;
-- Using CTE to perform calculation with Partition By
WITH PopvsVac AS (
SELECT dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations,
SUM(vac.new_vaccinations) OVER (PARTITION BY dea.location ORDER BY dea.date) AS RollingPeopleVaccinated
FROM coviddata.coviddeaths dea
JOIN coviddata.covidvaccinations vac
ON dea.location = vac.location
AND dea.date = vac.date
WHERE dea.continent IS NOT NULL
)
SELECT *, (RollingPeopleVaccinated / population) * 100 AS PercentPopulationVaccinated
FROM PopvsVac;
-- Using Temporary Table for calculations
DROP TEMPORARY TABLE IF EXISTS PercentPopulationVaccinated;
CREATE TEMPORARY TABLE PercentPopulationVaccinated (
Continent VARCHAR(255),
Location VARCHAR(255),
Date DATE,
Population BIGINT,
New_vaccinations BIGINT,
RollingPeopleVaccinated BIGINT
);
INSERT INTO PercentPopulationVaccinated
SELECT dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations,
SUM(vac.new_vaccinations) OVER (PARTITION BY dea.location ORDER BY dea.date) AS RollingPeopleVaccinated
FROM coviddata.coviddeaths dea
JOIN coviddata.covidvaccinations vac
ON dea.location = vac.location
AND dea.date = vac.date;
SELECT *, (RollingPeopleVaccinated / Population) * 100 AS PercentPopulationVaccinated
FROM PercentPopulationVaccinated;
-- Creating a View for later visualizations
CREATE OR REPLACE VIEW PercentPopulationVaccinated AS
SELECT dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations,
SUM(vac.new_vaccinations) OVER (PARTITION BY dea.location ORDER BY dea.date) AS RollingPeopleVaccinated
FROM coviddata.coviddeaths dea
JOIN coviddata.covidvaccinations vac
ON dea.location = vac.location
AND dea.date = vac.date
WHERE dea.continent IS NOT NULL;percentpopulationvaccinated2