Project on COVID-19 Data
In [1]:
import pandas as pd
In [2]:
# Absolute Windows location of the raw COVID-19 CSV; edit this one constant
# when running the notebook on another machine.
COVID_CSV_PATH = 'D:\\DATA ANALYTICS\\4. covid_19_data (1).csv'
data = pd.read_csv(COVID_CSV_PATH)
In [3]:
# Display the freshly loaded table to check that the CSV parsed as expected.
data
In [5]:
# Non-null entries per column; a column that falls short of the others
# contains missing values.
non_null_counts = data.count()
non_null_counts
Out[5]: Date 321
State 140
Region 321
Confirmed 321
Deaths 321
Recovered 321
dtype: int64
In [6]:
# Number of missing values in each column (isna is the canonical name of isnull).
data.isna().sum()
Out[6]: Date 0
State 181
Region 0
Confirmed 0
Deaths 0
Recovered 0
dtype: int64
In [8]:
import seaborn as sns
In [12]:
sns.heatmap(data.isnull())
Out[12]: <AxesSubplot:>
In [13]:
# Total confirmed and recovered cases per region.
# Several columns must be selected with a list: the bare tuple form
# groupby(...)['Confirmed','Recovered'] emits a FutureWarning on pandas 1.x
# and raises ValueError on pandas 2.0+.
data.groupby('Region')[['Confirmed', 'Recovered']].sum()
Region
Angola 27 7
Zambia 97 54
Zimbabwe 32 5
In [15]:
# Drop rows reporting fewer than MIN_CONFIRMED confirmed cases.
# NOTE: this rebinds `data`, so every later cell works on the filtered table.
MIN_CONFIRMED = 10
is_low_count = data['Confirmed'].lt(MIN_CONFIRMED)
data = data.loc[~is_low_count]
In [16]:
# Display the table after the rows with Confirmed < 10 were dropped.
data
Out[16]:
Date State Region Confirmed Deaths Recovered
In [17]:
# Total confirmed and recovered cases per region, recomputed on the filtered table.
# Several columns must be selected with a list: the bare tuple form
# groupby(...)['Confirmed','Recovered'] emits a FutureWarning on pandas 1.x
# and raises ValueError on pandas 2.0+.
data.groupby('Region')[['Confirmed', 'Recovered']].sum()
Region
Angola 27 7
Zambia 97 54
Zimbabwe 32 5
In [21]:
# Display the current state of the table again.
# NOTE(review): execution counts jump from 17 to 21 here; confirm that no
# since-deleted cell modified `data` in between.
data
In [30]:
# Total deaths per region, listed from fewest to most
# (ascending order is the sort_values default).
deaths_by_region = data.groupby('Region')['Deaths'].sum()
deaths_by_region.sort_values()
Out[30]: Region
Cambodia 0
Seychelles 0
Saint Lucia 0
...
France 24121
Spain 24275
UK 26165
Italy 27682
US 60967
In [38]:
# Rows whose Region is exactly 'India'.
is_india = data['Region'].eq('India')
data.loc[is_india]
In [41]:
# Order the rows by confirmed case count, smallest first.
data.sort_values('Confirmed')
In [ ]: