-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathData Exploration.sql
More file actions
84 lines (60 loc) · 2.64 KB
/
Data Exploration.sql
File metadata and controls
84 lines (60 loc) · 2.64 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
/*
Covid 19 Data Exploration
Skills used: Joins, CTEs, Temp Tables, Window Functions, Aggregate Functions, Creating Views, Converting Data Types
*/
-- Every column of the deaths table, limited to rows that carry a continent value.
-- NOTE(review): the sort is positional (3rd and 4th columns of the table), so it
-- depends on the table's column order -- presumably location and date; confirm.
SELECT
    *
FROM [Covid_database].[dbo].[Covid_deaths$]
WHERE continent IS NOT NULL
ORDER BY
    3,
    4;
-- Select the data that we are going to be starting with.
-- Rows without a continent value are excluded; the sort uses column names
-- instead of select-list positions so it survives edits to the column list.
SELECT
    location,
    date,
    total_cases,
    new_cases,
    total_deaths,
    population
FROM [Covid_database].[dbo].[Covid_deaths$]
WHERE continent IS NOT NULL
ORDER BY
    location,
    date;
-- Total Cases vs Total Deaths
-- Shows the likelihood of dying if you contract covid in India:
-- deaths as a percentage of cases, per reported date.
SELECT
    location,
    date,
    total_cases,
    total_deaths,
    -- NULLIF turns a zero case count into NULL so the division yields NULL
    -- instead of raising a divide-by-zero error.
    (total_deaths / NULLIF(total_cases, 0)) * 100 AS Death_Percentage
FROM [Covid_database].[dbo].[Covid_deaths$]
WHERE location = 'India'
    AND continent IS NOT NULL
ORDER BY
    location,
    date;
-- Total Cases vs Population
-- Shows what percentage of the population has been infected with Covid,
-- per location and date.
-- NOTE(review): unlike the neighbouring queries this one does not filter on
-- continent, so rows with a NULL continent are included -- confirm intended.
SELECT
    location,
    date,
    population,
    total_cases,
    -- NULLIF guards against a zero population raising a divide-by-zero error.
    (total_cases / NULLIF(population, 0)) * 100 AS Percent_Population_Infected
FROM [Covid_database].[dbo].[Covid_deaths$]
ORDER BY
    location,
    date;
-- Countries with the highest infection rate compared to population.
-- For each location: the peak total case count and the peak share of the
-- population infected, highest share first.
SELECT
    location,
    population,
    MAX(total_cases) AS Highest_Infection_Count,
    -- NULLIF guards against a zero population raising a divide-by-zero error.
    MAX(total_cases / NULLIF(population, 0)) * 100 AS Percent_Population_Infected
FROM [Covid_database].[dbo].[Covid_deaths$]
-- Same filter the other per-country queries in this file use: rows without a
-- continent value are excluded so only countries are ranked.
WHERE continent IS NOT NULL
GROUP BY
    location,
    population
ORDER BY Percent_Population_Infected DESC;
-- Countries ranked by their highest recorded total death count.
-- (This is an absolute count; it is not divided by population.)
-- total_deaths is cast to int before MAX is applied.
SELECT
    location,
    MAX(CAST(total_deaths AS int)) AS Total_Death_Count
FROM [Covid_database].[dbo].[Covid_deaths$]
WHERE continent IS NOT NULL
GROUP BY location
ORDER BY Total_Death_Count DESC;
-- BREAKING THINGS DOWN BY CONTINENT
-- Shows continents ordered by their total death count.
-- The total is the sum of new_deaths over every row of the continent.
-- MAX(total_deaths) would only return the largest cumulative count of a
-- single location inside the continent, not the continent-wide total.
SELECT
    continent,
    SUM(CAST(new_deaths AS int)) AS Total_Death_Count
FROM [Covid_database].[dbo].[Covid_deaths$]
WHERE continent IS NOT NULL
GROUP BY continent
ORDER BY Total_Death_Count DESC;
-- GLOBAL NUMBERS
-- One summary row over all rows that have a continent value: total new cases,
-- total new deaths, and deaths as a percentage of cases.
SELECT
    SUM(new_cases) AS total_cases,
    SUM(CAST(new_deaths AS int)) AS total_deaths,
    -- The numerator is cast to float so the ratio is never truncated by
    -- integer division; NULLIF yields NULL instead of a divide-by-zero error
    -- when no cases are recorded.
    CAST(SUM(CAST(new_deaths AS int)) AS float)
        / NULLIF(SUM(new_cases), 0) * 100 AS Death_Percentage
FROM [Covid_database].[dbo].[Covid_deaths$]
WHERE continent IS NOT NULL;
-- Total Population vs Vaccinations
-- Returns, per location and date, the population, the new vaccinations, and a
-- running total of new vaccinations for that location.
-- The running total cannot be referenced by its alias in this same SELECT
-- list, so a percentage of population has to be computed in an outer query
-- (for example a CTE or temp table built on top of this one).
-- NOTE(review): these table names are unqualified, unlike the three-part
-- names used by the other queries in this file -- confirm the intended
-- database and schema.
SELECT
    dea.continent,
    dea.location,
    dea.date,
    dea.population,
    vac.new_vaccinations,
    -- bigint instead of int: a cumulative vaccination count can exceed the
    -- int maximum (2,147,483,647) and fail with an arithmetic overflow error.
    -- The partition is already per location, so ordering by date is enough.
    SUM(CONVERT(bigint, vac.new_vaccinations)) OVER (
        PARTITION BY dea.location
        ORDER BY dea.date
    ) AS Rolling_People_Vaccinated
FROM Covid_deaths$ AS dea
INNER JOIN Covid_vaccinations$ AS vac
    ON dea.location = vac.location
    AND dea.date = vac.date
WHERE dea.continent IS NOT NULL
ORDER BY
    dea.location,
    dea.date;