From fce61d788c6897484e60e0e1b59d5c4b9c0e71e6 Mon Sep 17 00:00:00 2001
From: Vaishnavi Bhushan <96589133+VB-deeksha@users.noreply.github.com>
Date: Sun, 11 Jun 2023 12:58:54 +0530
Subject: [PATCH] Create Covid_19_data
---
Data Analytics/Covid_19_data | 507 +++++++++++++++++++++++++++++++++++
1 file changed, 507 insertions(+)
create mode 100644 Data Analytics/Covid_19_data
diff --git a/Data Analytics/Covid_19_data b/Data Analytics/Covid_19_data
new file mode 100644
index 00000000..9cc4697d
--- /dev/null
+++ b/Data Analytics/Covid_19_data
@@ -0,0 +1,507 @@
+{
+ "cells": [
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "id": "cc9cd027",
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import pandas as pd\n",
+ "import numpy as np\n",
+ "import seaborn as sns\n",
+ "import matplotlib.pyplot as plt"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "id": "2b0336a0",
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [],
+ "source": [
+ "data = pd.read_csv(\"covid_19_dataset.csv\")"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "id": "1457edd1",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " SNo | \n",
+ " ObservationDate | \n",
+ " Province/State | \n",
+ " Country/Region | \n",
+ " Last Update Time | \n",
+ " Confirmed | \n",
+ " Deaths | \n",
+ " Recovered | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 | \n",
+ " 1 | \n",
+ " 22-01-2020 | \n",
+ " Anhui | \n",
+ " Mainland China | \n",
+ " 22-01-2020 17:00 | \n",
+ " 1 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " 1 | \n",
+ " 2 | \n",
+ " 22-01-2020 | \n",
+ " Beijing | \n",
+ " Mainland China | \n",
+ " 22-01-2020 17:00 | \n",
+ " 14 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " 2 | \n",
+ " 3 | \n",
+ " 22-01-2020 | \n",
+ " Fujian | \n",
+ " Mainland China | \n",
+ " 22-01-2020 17:00 | \n",
+ " 6 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " 3 | \n",
+ " 4 | \n",
+ " 22-01-2020 | \n",
+ " Gansu | \n",
+ " Mainland China | \n",
+ " 22-01-2020 17:00 | \n",
+ " 1 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ " 4 | \n",
+ " 5 | \n",
+ " 22-01-2020 | \n",
+ " Guangdong | \n",
+ " Mainland China | \n",
+ " 22-01-2020 17:00 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ " 0 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " SNo ObservationDate Province/State Country/Region Last Update Time \\\n",
+ "0 1 22-01-2020 Anhui Mainland China 22-01-2020 17:00 \n",
+ "1 2 22-01-2020 Beijing Mainland China 22-01-2020 17:00 \n",
+ "2 3 22-01-2020 Fujian Mainland China 22-01-2020 17:00 \n",
+ "3 4 22-01-2020 Gansu Mainland China 22-01-2020 17:00 \n",
+ "4 5 22-01-2020 Guangdong Mainland China 22-01-2020 17:00 \n",
+ "\n",
+ " Confirmed Deaths Recovered \n",
+ "0 1 0 0 \n",
+ "1 14 0 0 \n",
+ "2 6 0 0 \n",
+ "3 1 0 0 \n",
+ "4 0 0 0 "
+ ]
+ },
+ "execution_count": 3,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "id": "030a514e",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "Index(['SNo', 'ObservationDate', 'Province/State', 'Country/Region',\n",
+ " 'Last Update Time', 'Confirmed', 'Deaths', 'Recovered'],\n",
+ " dtype='object')"
+ ]
+ },
+ "execution_count": 4,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data.columns"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "id": "31928232",
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " | \n",
+ " SNo | \n",
+ " Confirmed | \n",
+ " Deaths | \n",
+ " Recovered | \n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " count | \n",
+ " 50.00000 | \n",
+ " 50.000000 | \n",
+ " 50.000000 | \n",
+ " 50.000000 | \n",
+ "
\n",
+ " \n",
+ " mean | \n",
+ " 25.50000 | \n",
+ " 28.240000 | \n",
+ " 0.820000 | \n",
+ " 1.280000 | \n",
+ "
\n",
+ " \n",
+ " std | \n",
+ " 14.57738 | \n",
+ " 97.839218 | \n",
+ " 4.119094 | \n",
+ " 5.838087 | \n",
+ "
\n",
+ " \n",
+ " min | \n",
+ " 1.00000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " 25% | \n",
+ " 13.25000 | \n",
+ " 1.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " 50% | \n",
+ " 25.50000 | \n",
+ " 4.000000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " 75% | \n",
+ " 37.75000 | \n",
+ " 14.750000 | \n",
+ " 0.000000 | \n",
+ " 0.000000 | \n",
+ "
\n",
+ " \n",
+ " max | \n",
+ " 50.00000 | \n",
+ " 549.000000 | \n",
+ " 24.000000 | \n",
+ " 31.000000 | \n",
+ "
\n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " SNo Confirmed Deaths Recovered\n",
+ "count 50.00000 50.000000 50.000000 50.000000\n",
+ "mean 25.50000 28.240000 0.820000 1.280000\n",
+ "std 14.57738 97.839218 4.119094 5.838087\n",
+ "min 1.00000 0.000000 0.000000 0.000000\n",
+ "25% 13.25000 1.000000 0.000000 0.000000\n",
+ "50% 25.50000 4.000000 0.000000 0.000000\n",
+ "75% 37.75000 14.750000 0.000000 0.000000\n",
+ "max 50.00000 549.000000 24.000000 31.000000"
+ ]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "data.describe()"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "f4fa263f",
+ "metadata": {},
+ "source": [
+ "# Relating the variables with scatterplots"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "id": "5086bca7",
+ "metadata": {
+ "scrolled": true
+ },
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 6,
+ "metadata": {},
+ "output_type": "execute_result"
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ "