Skip to content

hirak-saharia/Covid-Analysis-using-SQL-Server

Folders and files

NameName
Last commit message
Last commit date

Latest commit

 

History

14 Commits
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 

Repository files navigation

Covid-Analysis-using-SQL Server Management Studio

We have imported Covid deaths and Vaccination excel files to analysis....

Queries performed....

To find the table information....

Select *From CovidAnalysis..CovidDeaths where continet is not null order by 3,4

Select * From CovidAnalysis..CovidVacciantion where continet is not null order by 3,4

-- Selected Data that we are going to be starting with

SELECT location, date, total_cases, new_cases, total_deaths, population From CovidAnalysis..CovidDeaths where continet is not null order by 1,2

-- Total Cases vs Total Deaths -- Shows likelihood of dying if you contract covid in your country

Select location, date, total_cases,total_deaths, (total_deaths/total_cases) From covidproject.coviddeaths2 order by 1,2 SELECT location, date, total_cases, total_deaths, (total_deaths/total_cases)*100 as DeathPercentage From CovidAnalysis..CovidDeaths where continet is not null order by 1,2

-- Shows likelihood of dying if you contract covid in your country >>>SELECT location, date, total_cases, total_deaths, (total_deaths/total_cases)*100 as DeathPercentage From CovidAnalysis..CovidDeaths where location like '%States%' OR where location like '%IND%' order by 1,2

--Looking at the total Cases vs Population --Shows what percentage of populations got covid

>>>SELECT location, date, population, total_cases, (total_cases/population)*100 as PercentagePopulation
From CovidAnalysis..CovidDeaths
where location like '%IND%'
order by 1,2

-- Countries with Highest Infection Rate compared to Population

SELECT location, population, MAX(total_cases) as HighestInfectionCount, MAX((total_cases/population))*100 as PercentPopulationInfected
From CovidAnalysis..CovidDeaths
--where location like '%IND%'
where continent is not null
Group by Location, Population
order by PercentPopulationInfected desc
--order by 1,2

-- Countries with Highest Death Count per Population

>>>>SELECT location, MAX(cast(total_deaths as int)) as TotalDeathsCount
FROM CovidAnalysis..CovidDeaths
where continent is not null
GROUP by location
order by TotalDeathsCount desc

--LET'S BREAK THINGS DOWN BY CONTINENT -- Showing contintents with the highest death count per population

SELECT continent, MAX(cast(total_deaths as int)) as TotalDeathsCount FROM CovidAnalysis..CovidDeaths where continent is not null GROUP by continent

---We see that number of total deaths as per the data is not matches with the Query....so we used this one istead..

SELECT location, MAX(cast(total_deaths as int)) as TotalDeathsCount FROM CovidAnalysis..CovidDeaths where continent is null GROUP by location order by TotalDeathsCount desc

---Global Numbers

SELECT date, SUM(new_cases) as New_Cases, SUM(cast(new_deaths as int)) as New_Deaths, SUM(cast(new_deaths as int))/SUM(new_cases)*100 as DeathPercentage ---total_deaths, (total_deaths/total_cases)*100 as DeathPercentage From CovidAnalysis..CovidDeaths --where location like '%IND%' where continent is not null group by date order by 1,2

--Overall Global numbers

SELECT SUM(new_cases) as New_Cases, SUM(cast(new_deaths as int)) as New_Deaths, SUM(cast(new_deaths as int))/SUM(new_cases)*100 as DeathPercentage ---total_deaths, (total_deaths/total_cases)*100 as DeathPercentage From CovidAnalysis..CovidDeaths --where location like '%IND%' where continent is not null --group by date order by 1,2

--Looking at Total Population VS Total Vaccinations

SELECT dea.continent, dea.location, dea.date, dea.population, new_vaccinations FROM CovidAnalysis..CovidDeaths dea JOIN CovidAnalysis..CovidVacciantion as vac on dea.location = vac.location and dea.date = vac.date where dea.continent is not null order by 2,3

-- Using CTE to perform Calculation on Partition By in previous query

>>>With PopvsVac (Continent, Location, Date, Population, New_Vaccinations, RollingPeopleVaccinated)
   as
   (
   SELECT dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations
   , SUM(convert(int, vac.new_vaccinations)) OVER (Partition by dea.location order by dea.location, dea.date) as RollingPeopleVacinated
   --, (RollingPeopleVacinated/population)*100
   FROM CovidAnalysis..CovidDeaths dea
   JOIN CovidAnalysis..CovidVacciantion as vac
       on dea.location = vac.location
       and dea.date = vac.date
   where dea.continent is not null
    --order by 2,3
   )
   SELECT * 
   FROM PopvsVac

---We got things that wanted for further calculation and let's calculate the Percentage of RollingPeopleVaccinates by Populations

With PopvsVac (Continent, Location, Date, Population, New_Vaccinations, RollingPeopleVaccinated)
as
(
Select dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations
, SUM(CONVERT(int,vac.new_vaccinations)) OVER (Partition by dea.Location Order by dea.location, dea.Date) as RollingPeopleVaccinated
--, (RollingPeopleVaccinated/population)*100
From CovidAnalysis..CovidDeaths dea
Join CovidAnalysis..CovidVacciantion vac
     On dea.location = vac.location
     and dea.date = vac.date
where dea.continent is not null 
--order by 2,3
)
Select *, (RollingPeopleVaccinated/Population)*100 as PercentageOfRollingPeopleVaccinated
From PopvsVac

---LET'S CREATE A TEMP TABLE...

   DROP Table if exists #PercentageOfPopulationVaccinated
   CREATE Table #PercentageOfPopulationVaccinated

   (
   Continent nvarchar (255),
   Location nvarchar (255),
   Date datetime,
   Population numeric,
   New_Vaccications numeric,
   RollingPeopleVaccinated numeric

   )
   Insert Into #PercentageOfPopulationVaccinated
   Select dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations
   , SUM(CONVERT(int,vac.new_vaccinations)) OVER (Partition by dea.Location Order by dea.location, dea.Date) as RollingPeopleVaccinated
   --, (RollingPeopleVaccinated/population)*100
   From CovidAnalysis..CovidDeaths dea
   Join CovidAnalysis..CovidVacciantion vac
        On dea.location = vac.location
        and dea.date = vac.date
   --where dea.continent is not null 
   --order by 2,3

   Select *, (RollingPeopleVaccinated/Population)*100 as PercentageOfRollingPeopleVaccinated
   From #PercentageOfPopulationVaccinated

-- Creating View to store data for later visualizations

      Create View FinalPercentPopulationVaccinated as
      Select dea.continent, dea.location, dea.date, dea.population, vac.new_vaccinations
     , SUM(CONVERT(int,vac.new_vaccinations)) OVER (Partition by dea.Location Order by dea.location, dea.Date) as RollingPeopleVaccinated
     --, (RollingPeopleVaccinated/population)*100
     From CovidAnalysis..CovidDeaths dea
     Join CovidAnalysis..CovidVacciantion vac
          On dea.location = vac.location
         and dea.date = vac.date
     where dea.continent is not null 

--To view the created table for further anysis in any BI Plateform SELECT * FROM FinalPercentPopulationVaccinated

About

No description, website, or topics provided.

Resources

Stars

Watchers

Forks

Releases

No releases published

Packages

No packages published