0% found this document useful (0 votes)

9 views11 pages

Covid 19 Analysis and Visualization Using Plotly Express

The document outlines data analysis and manipulation using Python libraries such as Plotly and Pandas, focusing on COVID-19 datasets. It describes two datasets: 'dataset1' with 209 rows and 17 columns, and 'dataset2' with 35,156 rows and multiple fields related to COVID-19 statistics. The document includes information on data types, unique values, and sample data for each column in the datasets.

Uploaded by

fvdhmjtdzcpbchsduk

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

9 views11 pages

Covid 19 Analysis and Visualization Using Plotly Express

Uploaded by

fvdhmjtdzcpbchsduk

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 11

# Data analysis and Manipulation

import plotly.graph_objs as go
import plotly.io as pio
import plotly.express as px
import pandas as pd

# Data Visualization
import matplotlib.pyplot as plt

# Plotly's offline module (aliased `py`); notebook mode is enabled here,
# before py.iplot() is called further down.
import plotly.offline as py
py.init_notebook_mode(connected=True)

# Make 'colab' the default Plotly renderer.
pio.renderers.default = 'colab'

# Load the first dataset from covid.csv (path is relative to the working directory).
dataset1 = pd.read_csv("covid.csv")
dataset1.head() # returns first 5 rows

{"summary":"{\n \"name\": \"dataset1\",\n \"rows\": 209,\n

\"fields\": [\n {\n \"column\": \"Country/Region\",\n
\"properties\": {\n \"dtype\": \"string\",\n
\"num_unique_values\": 209,\n \"samples\": [\n
\"Oman\",\n \"Martinique\",\n \"French Guiana\"\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"Continent\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 6,\n \"samples\": [\n \"North
America\",\n \"South America\",\n
\"Australia/Oceania\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Population\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 104766099.48117349,\n \"min\":
801.0,\n \"max\": 1381344997.0,\n \"num_unique_values\":
208,\n \"samples\": [\n 23821199.0,\n
60452568.0,\n 5794279.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"TotalCases\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
432586,\n \"min\": 10,\n \"max\": 5032179,\n
\"num_unique_values\": 206,\n \"samples\": [\n
249204,\n 354530,\n 17\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"NewCases\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\":
3129.611424229319,\n \"min\": 20.0,\n \"max\": 6590.0,\n
\"num_unique_values\": 4,\n \"samples\": [\n 1282.0,\n
30.0,\n 6590.0\n ],\n \"semantic_type\": \"\",\
n \"description\": \"\"\n }\n },\n {\n
\"column\": \"TotalDeaths\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 15487.184877168185,\n
\"min\": 1.0,\n \"max\": 162804.0,\n
\"num_unique_values\": 150,\n \"samples\": [\n 617.0,\
n 9252.0,\n 5.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"NewDeaths\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
451.1995124110841,\n \"min\": 1.0,\n \"max\": 819.0,\n
\"num_unique_values\": 3,\n \"samples\": [\n 819.0,\n
80.0,\n 1.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"TotalRecovered\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 256698.40689838002,\n \"min\":
7.0,\n \"max\": 2576668.0,\n \"num_unique_values\":
201,\n \"samples\": [\n 652.0,\n 99852.0,\n
40539.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"NewRecovered\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 2154.779803135346,\n \"min\":
42.0,\n \"max\": 4140.0,\n \"num_unique_values\": 3,\n
\"samples\": [\n 4140.0,\n 936.0,\n 42.0\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"ActiveCases\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
174632.7369279219,\n \"min\": 0.0,\n \"max\":
2292707.0,\n \"num_unique_values\": 180,\n \"samples\":
[\n 50473.0,\n 37559.0,\n 17.0\n ],\
n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"Serious,Critical\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
2047.5186133519667,\n \"min\": 1.0,\n \"max\": 18296.0,\
n \"num_unique_values\": 74,\n \"samples\": [\n
539.0,\n 11.0,\n 384.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Tot Cases/1M pop\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
5191.986456701242,\n \"min\": 3.0,\n \"max\": 39922.0,\n
\"num_unique_values\": 202,\n \"samples\": [\n
1317.0,\n 4122.0,\n 15769.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Deaths/1M pop\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
174.9568620893644,\n \"min\": 0.08,\n \"max\": 1238.0,\n
\"num_unique_values\": 107,\n \"samples\": [\n 38.0,\n
214.0,\n 162.0\n ],\n \"semantic_type\": \"\",\
n \"description\": \"\"\n }\n },\n {\n
\"column\": \"TotalTests\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 5553366.67043168,\n
\"min\": 61.0,\n \"max\": 63139605.0,\n
\"num_unique_values\": 190,\n \"samples\": [\n
1183.0,\n 4238.0,\n 29233.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Tests/1M pop\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
152730.59123995784,\n \"min\": 4.0,\n \"max\":
995282.0,\n \"num_unique_values\": 190,\n \"samples\":
[\n 22050.0,\n 3209.0,\n 11485.0\
n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\": \"WHO
Region\",\n \"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 6,\n \"samples\": [\n
\"Americas\",\n \"South-EastAsia\",\n
\"WesternPacific\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"iso_alpha\",\n \"properties\": {\n \"dtype\":
\"string\",\n \"num_unique_values\": 193,\n \"samples\":
[\n \"HND\",\n \"TGO\",\n \"MKD\"\
n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"dataset1"}

# Returns tuple of shape (Rows, columns)

print(dataset1.shape)

# Returns size of dataframe

print(dataset1.size)

(209, 17)
3553

# Information about Dataset1

# return concise summary of dataframe
dataset1.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 209 entries, 0 to 208
Data columns (total 17 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 Country/Region 209 non-null object
1 Continent 208 non-null object
2 Population 208 non-null float64
3 TotalCases 209 non-null int64
4 NewCases 4 non-null float64
5 TotalDeaths 188 non-null float64
6 NewDeaths 3 non-null float64
7 TotalRecovered 205 non-null float64
8 NewRecovered 3 non-null float64
9 ActiveCases 205 non-null float64
10 Serious,Critical 122 non-null float64
11 Tot Cases/1M pop 208 non-null float64
12 Deaths/1M pop 187 non-null float64
13 TotalTests 191 non-null float64
14 Tests/1M pop 191 non-null float64
15 WHO Region 184 non-null object
16 iso_alpha 209 non-null object
dtypes: float64(12), int64(1), object(4)
memory usage: 27.9+ KB

# Importing Dataset2
dataset2 = pd.read_csv("covid_grouped.csv")
dataset2.head() # return first 5 rows of dataset2

{"summary":"{\n \"name\": \"dataset2\",\n \"rows\": 35156,\n

\"fields\": [\n {\n \"column\": \"Date\",\n
\"properties\": {\n \"dtype\": \"object\",\n
\"num_unique_values\": 188,\n \"samples\": [\n \"2020-
07-23\",\n \"2020-07-02\",\n \"2020-02-09\"\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"Country/Region\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 187,\n \"samples\": [\n
\"Zambia\",\n \"Iceland\",\n \"Eritrea\"\
n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Confirmed\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 149981,\n \"min\": 0,\n
\"max\": 4290259,\n \"num_unique_values\": 10732,\n
\"samples\": [\n 2913,\n 29767,\n 169425\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"Deaths\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 7437,\n
\"min\": 0,\n \"max\": 148011,\n \"num_unique_values\":
3598,\n \"samples\": [\n 6679,\n 312,\n
34854\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Recovered\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 64546,\n \"min\": 0,\n
\"max\": 1846641,\n \"num_unique_values\": 7649,\n
\"samples\": [\n 5223,\n 67309,\n 1303\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"Active\",\n \"properties\":
{\n \"dtype\": \"number\",\n \"std\": 89971,\n
\"min\": -2,\n \"max\": 2816444,\n
\"num_unique_values\": 8440,\n \"samples\": [\n 441,\n
46057,\n 1706\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\": \"New
cases\",\n \"properties\": {\n \"dtype\": \"number\",\n
\"std\": 3005,\n \"min\": 0,\n \"max\": 77255,\n
\"num_unique_values\": 2800,\n \"samples\": [\n 1496,\
n 1684,\n 4288\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"New deaths\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
115,\n \"min\": -1918,\n \"max\": 3887,\n
\"num_unique_values\": 715,\n \"samples\": [\n 839,\n
587,\n 35\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\": \"New
recovered\",\n \"properties\": {\n \"dtype\": \"number\",\
n \"std\": 2068,\n \"min\": -16298,\n \"max\":
140050,\n \"num_unique_values\": 2276,\n \"samples\": [\
n 26784,\n 1629,\n 2390\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"WHO Region\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 6,\n \"samples\": [\n \"Eastern
Mediterranean\",\n \"Europe\",\n \"South-East
Asia\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"iso_alpha\",\n \"properties\": {\n \"dtype\":
\"category\",\n \"num_unique_values\": 179,\n
\"samples\": [\n \"IDN\",\n \"BEL\",\n
\"GRC\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"dataset2"}

# Returns tuple of shape (Rows, columns)

print(dataset2.shape)

# Returns size of dataframe

print(dataset2.size)

(35156, 11)
386716

# Information about Dataset2

dataset2.info() # return concise summary of dataframe

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 35156 entries, 0 to 35155
Data columns (total 11 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 Date 35156 non-null object
1 Country/Region 35156 non-null object
2 Confirmed 35156 non-null int64
3 Deaths 35156 non-null int64
4 Recovered 35156 non-null int64
5 Active 35156 non-null int64
6 New cases 35156 non-null int64
7 New deaths 35156 non-null int64
8 New recovered 35156 non-null int64
9 WHO Region 35156 non-null object
10 iso_alpha 35156 non-null object
dtypes: int64(7), object(4)
memory usage: 3.0+ MB

# Column labels of dataset1

dataset1.columns

Index(['Country/Region', 'Continent', 'Population', 'TotalCases',

'NewCases',
'TotalDeaths', 'NewDeaths', 'TotalRecovered', 'NewRecovered',
'ActiveCases', 'Serious,Critical', 'Tot Cases/1M pop',
'Deaths/1M pop',
'TotalTests', 'Tests/1M pop', 'WHO Region', 'iso_alpha'],
dtype='object')

# Drop the NewCases, NewDeaths and NewRecovered columns (axis=1) from dataset1,
# in place. Per the info() summary above they hold only 4, 3 and 3 non-null
# values out of 209 rows.
dataset1.drop(['NewCases', 'NewDeaths', 'NewRecovered'],

axis=1, inplace=True)

# Select random set of values from dataset1

dataset1.sample(5)

{"summary":"{\n \"name\": \"dataset1\",\n \"rows\": 5,\n

\"fields\": [\n {\n \"column\": \"Country/Region\",\n
\"properties\": {\n \"dtype\": \"string\",\n
\"num_unique_values\": 5,\n \"samples\": [\n
\"Monaco\",\n \"Cambodia\",\n \"UK\"\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Continent\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 2,\n \"samples\": [\n
\"Europe\",\n \"Asia\"\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Population\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
112103852.12999673,\n \"min\": 39270.0,\n \"max\":
273808365.0,\n \"num_unique_values\": 5,\n \"samples\":
[\n 39270.0,\n 16741375.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"TotalCases\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
364585,\n \"min\": 125,\n \"max\": 871894,\n
\"num_unique_values\": 5,\n \"samples\": [\n 125,\n
243\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"TotalDeaths\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 20744.13393387795,\n \"min\":
4.0,\n \"max\": 46413.0,\n \"num_unique_values\": 4,\n
\"samples\": [\n 4.0,\n 14606.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"TotalRecovered\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
327457.78123637557,\n \"min\": 105.0,\n \"max\":
676357.0,\n \"num_unique_values\": 4,\n \"samples\": [\n
105.0,\n 210.0\n ],\n \"semantic_type\": \"\",\
n \"description\": \"\"\n }\n },\n {\n
\"column\": \"ActiveCases\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 86034.73581980323,\n
\"min\": 16.0,\n \"max\": 180931.0,\n
\"num_unique_values\": 4,\n \"samples\": [\n 16.0,\n
33.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Serious,Critical\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 1137.8327352178496,\n \"min\":
1.0,\n \"max\": 2300.0,\n \"num_unique_values\": 4,\n
\"samples\": [\n 73.0,\n 1.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Tot Cases/1M pop\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
2578.188569519305,\n \"min\": 15.0,\n \"max\": 5974.0,\n
\"num_unique_values\": 5,\n \"samples\": [\n 3183.0,\n
15.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Deaths/1M pop\",\n \"properties\": {\n \"dtype\":
\"number\",\n \"std\": 306.88583653643366,\n \"min\":
20.0,\n \"max\": 683.0,\n \"num_unique_values\": 4,\n
\"samples\": [\n 102.0,\n 100.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"TotalTests\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
13350218.542872969,\n \"min\": 38209.0,\n \"max\":
29716907.0,\n \"num_unique_values\": 5,\n \"samples\":
[\n 38209.0,\n 67807.0\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Tests/1M pop\",\n
\"properties\": {\n \"dtype\": \"number\",\n \"std\":
399185.0325654758,\n \"min\": 4050.0,\n \"max\":
972982.0,\n \"num_unique_values\": 5,\n \"samples\": [\n
972982.0,\n 4050.0\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"WHO Region\",\n \"properties\": {\n
\"dtype\": \"string\",\n \"num_unique_values\": 3,\n
\"samples\": [\n \"South-EastAsia\",\n \"Europe\"\n
],\n \"semantic_type\": \"\",\n \"description\": \"\"\n
}\n },\n {\n \"column\": \"iso_alpha\",\n
\"properties\": {\n \"dtype\": \"string\",\n
\"num_unique_values\": 5,\n \"samples\": [\n \"MCO\",\
n \"KHM\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n }\n ]\n}","type":"dataframe"}

# Show the first 15 rows of dataset1 as a Plotly table figure.
from plotly.figure_factory import create_table

# Three-stop colorscale handed to create_table (positions 0, 0.5 and 1).
colorscale = [
    [0, '#4d004c'],
    [0.5, '#f2e5ff'],
    [1, '#ffffff'],
]

table = create_table(dataset1.head(15), colorscale=colorscale)
py.iplot(table)

# Bar charts over the first 15 rows of dataset1. Every chart adds the country
# and its continent to the hover tooltip.

# Total cases per country, coloured by total cases.
px.bar(
    dataset1.head(15),
    x='Country/Region',
    y='TotalCases',
    color='TotalCases',
    height=500,
    hover_data=['Country/Region', 'Continent'],
)

# Total cases per country, coloured by total deaths.
px.bar(
    dataset1.head(15),
    x='Country/Region',
    y='TotalCases',
    color='TotalDeaths',
    height=500,
    hover_data=['Country/Region', 'Continent'],
)

# NOTE(review): this call is identical to the previous one. It may have been
# meant to colour by a different column -- confirm before changing or removing.
px.bar(
    dataset1.head(15),
    x='Country/Region',
    y='TotalCases',
    color='TotalDeaths',
    height=500,
    hover_data=['Country/Region', 'Continent'],
)

# Total cases per country, coloured by total tests.
px.bar(
    dataset1.head(15),
    x='Country/Region',
    y='TotalCases',
    color='TotalTests',
    height=500,
    hover_data=['Country/Region', 'Continent'],
)

# Horizontal bars: total tests per country.
px.bar(
    dataset1.head(15),
    x='TotalTests',
    y='Country/Region',
    color='TotalTests',
    orientation='h',
    height=500,
    hover_data=['Country/Region', 'Continent'],
)

# Horizontal bars: total tests with the continent on the y axis.
px.bar(
    dataset1.head(15),
    x='TotalTests',
    y='Continent',
    color='TotalTests',
    orientation='h',
    height=500,
    hover_data=['Country/Region', 'Continent'],
)

# Bubble (scatter) charts over dataset1. Marker size follows the `size` column,
# capped at size_max=80; hover shows the country and its continent.
# NOTE(review): per the info() summary, TotalTests, TotalDeaths and
# Tests/1M pop contain missing values. Plotly is expected to reject NaN marker
# sizes -- confirm the selected head(...) rows contain none.

# Total cases by continent, all rows.
px.scatter(
    dataset1,
    x='Continent',
    y='TotalCases',
    hover_data=['Country/Region', 'Continent'],
    color='TotalCases',
    size='TotalCases',
    size_max=80,
)

# Total tests by continent, first 54 rows.
px.scatter(
    dataset1.head(54),
    x='Continent',
    y='TotalTests',
    hover_data=['Country/Region', 'Continent'],
    color='TotalTests',
    size='TotalTests',
    size_max=80,
)

# Total tests by continent, first 50 rows, logarithmic y axis.
px.scatter(
    dataset1.head(50),
    x='Continent',
    y='TotalTests',
    hover_data=['Country/Region', 'Continent'],
    color='TotalTests',
    size='TotalTests',
    size_max=80,
    log_y=True,
)

# Total deaths per country, first 10 rows, one colour per country.
px.scatter(
    dataset1.head(10),
    x='Country/Region',
    y='TotalDeaths',
    hover_data=['Country/Region', 'Continent'],
    color='Country/Region',
    size='TotalDeaths',
    size_max=80,
)

# Tests per million per country, first 30 rows, one colour per country.
px.scatter(
    dataset1.head(30),
    x='Country/Region',
    y='Tests/1M pop',
    hover_data=['Country/Region', 'Continent'],
    color='Country/Region',
    size='Tests/1M pop',
    size_max=80,
)

# Same chart, coloured by the tests-per-million value instead.
px.scatter(
    dataset1.head(30),
    x='Country/Region',
    y='Tests/1M pop',
    hover_data=['Country/Region', 'Continent'],
    color='Tests/1M pop',
    size='Tests/1M pop',
    size_max=80,
)

# Total deaths against total cases, first 30 rows.
px.scatter(
    dataset1.head(30),
    x='TotalCases',
    y='TotalDeaths',
    hover_data=['Country/Region', 'Continent'],
    color='TotalDeaths',
    size='TotalDeaths',
    size_max=80,
)

# Same chart with both axes logarithmic.
px.scatter(
    dataset1.head(30),
    x='TotalCases',
    y='TotalDeaths',
    hover_data=['Country/Region', 'Continent'],
    color='TotalDeaths',
    size='TotalDeaths',
    size_max=80,
    log_x=True,
    log_y=True,
)

# Total cases against total tests, first 30 rows, both axes logarithmic.
px.scatter(
    dataset1.head(30),
    x='TotalTests',
    y='TotalCases',
    hover_data=['Country/Region', 'Continent'],
    color='TotalTests',
    size='TotalTests',
    size_max=80,
    log_x=True,
    log_y=True,
)

# Per-date charts for a single country taken from dataset2.
#
# df_US was used below without ever being defined in the visible notebook, so
# every call raised NameError. It is defined here as the dataset2 rows whose
# Country/Region is "US".
# NOTE(review): assumes the country is labelled "US" in covid_grouped.csv --
# confirm against the data (an unmatched label yields an empty frame).
df_US = dataset2.loc[dataset2["Country/Region"] == "US"]

# Confirmed cases per date, coloured by the confirmed count.
px.bar(df_US, x="Date", y="Confirmed", color="Confirmed", height=400)

# Recovered cases per date, coloured by the recovered count.
px.bar(df_US,x="Date", y="Recovered", color="Recovered", height=400)

# Line charts of recovered, deaths, confirmed and new cases over the dates.
px.line(df_US,x="Date", y="Recovered", height=400)

px.line(df_US,x="Date", y="Deaths", height=400)

px.line(df_US,x="Date", y="Confirmed", height=400)

px.line(df_US,x="Date", y="New cases", height=400)

# New cases per date as bars.
px.bar(df_US,x="Date", y="New cases", height=400)

# Deaths against confirmed cases.
px.scatter(df_US, x="Confirmed", y="Deaths", height=400)

# Animated charts over dataset2, using the Date column as the animation frame.
# Countries are located on the map through the iso_alpha column.

# Confirmed cases.
px.choropleth(
    dataset2,
    locations="iso_alpha",
    color="Confirmed",
    hover_name="Country/Region",
    color_continuous_scale="Blues",
    animation_frame="Date",
)

# Deaths.
px.choropleth(
    dataset2,
    locations="iso_alpha",
    color="Deaths",
    hover_name="Country/Region",
    color_continuous_scale="Viridis",
    animation_frame="Date",
)

# Recovered cases, drawn with the "natural earth" projection.
px.choropleth(
    dataset2,
    locations="iso_alpha",
    color="Recovered",
    hover_name="Country/Region",
    color_continuous_scale="RdYlGn",
    projection="natural earth",
    animation_frame="Date",
)

# Confirmed cases per WHO region; the country name is the hover title.
px.bar(
    dataset2,
    x="WHO Region",
    y="Confirmed",
    color="WHO Region",
    animation_frame="Date",
    hover_name="Country/Region",
)

dataset3= pd.read_csv("coviddeath.csv")
dataset3.head()

{"summary":"{\n \"name\": \"dataset3\",\n \"rows\": 12260,\n

\"fields\": [\n {\n \"column\": \"Data as of\",\n
\"properties\": {\n \"dtype\": \"object\",\n
\"num_unique_values\": 1,\n \"samples\": [\n
\"08/30/2020\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Start Week\",\n \"properties\": {\n \"dtype\":
\"object\",\n \"num_unique_values\": 1,\n \"samples\":
[\n \"02/01/2020\"\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"End Week\",\n \"properties\": {\n \"dtype\":
\"object\",\n \"num_unique_values\": 1,\n \"samples\":
[\n \"08/29/2020\"\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n },\n {\n
\"column\": \"State\",\n \"properties\": {\n \"dtype\":
\"category\",\n \"num_unique_values\": 54,\n
\"samples\": [\n \"LA\"\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Condition Group\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 12,\n \"samples\": [\n \"All
other conditions and causes (residual)\"\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Condition\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 23,\n \"samples\": [\n
\"Diabetes\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"ICD10_codes\",\n \"properties\": {\n \"dtype\":
\"category\",\n \"num_unique_values\": 23,\n
\"samples\": [\n \"E10-E14\"\n ],\n
\"semantic_type\": \"\",\n \"description\": \"\"\n }\
n },\n {\n \"column\": \"Age Group\",\n
\"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 10,\n \"samples\": [\n \"Not
stated\"\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Number of COVID-19 Deaths\",\n \"properties\": {\n
\"dtype\": \"number\",\n \"std\": 3411.6853195964054,\n
\"min\": 0.0,\n \"max\": 169044.0,\n
\"num_unique_values\": 1022,\n \"samples\": [\n
5915.0\n ],\n \"semantic_type\": \"\",\n
\"description\": \"\"\n }\n },\n {\n \"column\":
\"Flag\",\n \"properties\": {\n \"dtype\": \"category\",\n
\"num_unique_values\": 1,\n \"samples\": [\n \"Counts
less than 10 suppressed.\"\n ],\n \"semantic_type\":
\"\",\n \"description\": \"\"\n }\n }\n ]\
n}","type":"dataframe","variable_name":"dataset3"}

dataset3.tail()

{"repr_error":"0","type":"dataframe"}

Sales - Project - v3 (2) .Ipynb
No ratings yet
Sales - Project - v3 (2) .Ipynb
1,230 pages
Exp 1 A
No ratings yet
Exp 1 A
5 pages
It, Culture, and The Society
78% (9)
It, Culture, and The Society
17 pages
Kidney Ipynb
No ratings yet
Kidney Ipynb
253 pages
Time Series Forecasting Jupyter Code - Ipynb
No ratings yet
Time Series Forecasting Jupyter Code - Ipynb
2,484 pages
Another Copy of Ensemble Models Original Paid
No ratings yet
Another Copy of Ensemble Models Original Paid
51 pages
Kidney Disease Prediction - Ipynb
No ratings yet
Kidney Disease Prediction - Ipynb
148 pages
Information Security Fundamental Weaknesses Place EPA Data and Operations at Risk 1st Edition by Government Accountability Office ISBN 1508400784 9781508400783 Instant Download
100% (6)
Information Security Fundamental Weaknesses Place EPA Data and Operations at Risk 1st Edition by Government Accountability Office ISBN 1508400784 9781508400783 Instant Download
75 pages
Covid Project
No ratings yet
Covid Project
87 pages
BD WPS2
No ratings yet
BD WPS2
23 pages
Project 04 - Data Analysis of Covid-19.ipynb
No ratings yet
Project 04 - Data Analysis of Covid-19.ipynb
73 pages
ADS LAB Merged
No ratings yet
ADS LAB Merged
86 pages
Regresión Lineal Con Python - Ipynb
No ratings yet
Regresión Lineal Con Python - Ipynb
83 pages
VoThaiThaoNhi ECON209 F2024 Lab 2
No ratings yet
VoThaiThaoNhi ECON209 F2024 Lab 2
10 pages
Vedant, Aiml
No ratings yet
Vedant, Aiml
63 pages
Project Report of RICHA
No ratings yet
Project Report of RICHA
31 pages
IS - Extended - Project - Guided - Template - Notebook
No ratings yet
IS - Extended - Project - Guided - Template - Notebook
26 pages
Import As Import As Import As Import: Pandas PD Numpy NP Matplotlib - Pyplot PLT Sklearn DF PD - Read - CSV DF
No ratings yet
Import As Import As Import As Import: Pandas PD Numpy NP Matplotlib - Pyplot PLT Sklearn DF PD - Read - CSV DF
9 pages
Arima Text
No ratings yet
Arima Text
49 pages
Merged
No ratings yet
Merged
35 pages
Implementing OLS Regression On Boston Housing Secondary Dataset. Also Check The Data For Missing Values and Outliers.
No ratings yet
Implementing OLS Regression On Boston Housing Secondary Dataset. Also Check The Data For Missing Values and Outliers.
26 pages
Data Science Code
No ratings yet
Data Science Code
29 pages
ML Lab-1
No ratings yet
ML Lab-1
5 pages
# Importing Necessary Libraries: Import As Import As Import As Import As
No ratings yet
# Importing Necessary Libraries: Import As Import As Import As Import As
21 pages
Keeratsi HW8
No ratings yet
Keeratsi HW8
17 pages
Az4 Ipynb
No ratings yet
Az4 Ipynb
17 pages
DACLUSTER
No ratings yet
DACLUSTER
9 pages
Copy of ML - Assignment
No ratings yet
Copy of ML - Assignment
7 pages
Copy of Final Project
No ratings yet
Copy of Final Project
16 pages
DAR CompleteFile 1
No ratings yet
DAR CompleteFile 1
41 pages
MLT Ann Lab 2
No ratings yet
MLT Ann Lab 2
7 pages
Dsbda Exp4 Part1
No ratings yet
Dsbda Exp4 Part1
39 pages
Heart Disease Classification Full-1
No ratings yet
Heart Disease Classification Full-1
3 pages
Projet 2 Classification Des Crédits
No ratings yet
Projet 2 Classification Des Crédits
24 pages
1 4-EDA Ipynb
No ratings yet
1 4-EDA Ipynb
12 pages
Xgboost
No ratings yet
Xgboost
12 pages
Exp - 2-EDA - CaliforniaData Set - HeatMap - PairPlot-checkpoint - Jupyter Notebook
No ratings yet
Exp - 2-EDA - CaliforniaData Set - HeatMap - PairPlot-checkpoint - Jupyter Notebook
12 pages
Social Network Analysis: Cheruvu Nvss Suhas 21BCE8374
No ratings yet
Social Network Analysis: Cheruvu Nvss Suhas 21BCE8374
10 pages
Preprocessing1.ipynb - Colab
No ratings yet
Preprocessing1.ipynb - Colab
13 pages
Data Science Practicals - Ipynb
No ratings yet
Data Science Practicals - Ipynb
54 pages
Task 1
No ratings yet
Task 1
5 pages
A4 Dsbda Sana
No ratings yet
A4 Dsbda Sana
16 pages
Bose A S
No ratings yet
Bose A S
37 pages
Model2.ipynb - Colab
No ratings yet
Model2.ipynb - Colab
11 pages
Week 4
No ratings yet
Week 4
13 pages
Dsa 1
No ratings yet
Dsa 1
8 pages
B58 - Handling Missing Values, Feature - Selection
No ratings yet
B58 - Handling Missing Values, Feature - Selection
4 pages
Supply Chain Analytics
No ratings yet
Supply Chain Analytics
20 pages
Covid19-Maro (2) - JupyterLab
No ratings yet
Covid19-Maro (2) - JupyterLab
7 pages
Model
No ratings yet
Model
5 pages
Baseline - Ipynb - Colab
No ratings yet
Baseline - Ipynb - Colab
5 pages
1 Introduction To Statsmodels
No ratings yet
1 Introduction To Statsmodels
28 pages
KNN For Classification
No ratings yet
KNN For Classification
5 pages
ModuleAr Merged
No ratings yet
ModuleAr Merged
42 pages
Delhivery Mani
No ratings yet
Delhivery Mani
79 pages
Heart Disease Diagnosis Using Machine Learning
No ratings yet
Heart Disease Diagnosis Using Machine Learning
26 pages
Software Quality Metrics Overview
No ratings yet
Software Quality Metrics Overview
63 pages
Cleaning Data
No ratings yet
Cleaning Data
6 pages
Data Visualization EDA-print
No ratings yet
Data Visualization EDA-print
18 pages
MCQ On Dataframe
No ratings yet
MCQ On Dataframe
11 pages
B58 Random Forest
No ratings yet
B58 Random Forest
4 pages
SESION 12 (Pandas)
No ratings yet
SESION 12 (Pandas)
41 pages
Hikvision Cybersecurity Milestones
No ratings yet
Hikvision Cybersecurity Milestones
2 pages
Also Electric Curcuit Workbook With Solutions
No ratings yet
Also Electric Curcuit Workbook With Solutions
27 pages
EIN IRS MicroInformationTechnologies
100% (1)
EIN IRS MicroInformationTechnologies
2 pages
RetiCam 3100 Mini
No ratings yet
RetiCam 3100 Mini
4 pages
BBM 104 (Abhinav Pandey Sir)
No ratings yet
BBM 104 (Abhinav Pandey Sir)
4 pages
MILLIPEDE Concept
No ratings yet
MILLIPEDE Concept
23 pages
MRI Acronyms Brochure 2020
No ratings yet
MRI Acronyms Brochure 2020
12 pages
Chapter 7: Deadlocks: The Deadlock Problem System Model Deadlock Characterization Methods For Handling Deadlocks
No ratings yet
Chapter 7: Deadlocks: The Deadlock Problem System Model Deadlock Characterization Methods For Handling Deadlocks
63 pages
Inspection Checklist
No ratings yet
Inspection Checklist
11 pages
Evaluating Limits of Trigonometric and Exponential Functions
No ratings yet
Evaluating Limits of Trigonometric and Exponential Functions
12 pages
Dura Wall - Kuwadzana1
No ratings yet
Dura Wall - Kuwadzana1
7 pages
FREE CompuSec v5.3 Manual
No ratings yet
FREE CompuSec v5.3 Manual
61 pages
Learn Dutch On The Web Recommendations
No ratings yet
Learn Dutch On The Web Recommendations
3 pages
Unit 4 Physical Pharmaceutics 1
No ratings yet
Unit 4 Physical Pharmaceutics 1
37 pages
M2 Cert Pro Dev Exam v2 - 3 Study GD PDF
No ratings yet
M2 Cert Pro Dev Exam v2 - 3 Study GD PDF
21 pages
Módulos Canadian 440Wp
No ratings yet
Módulos Canadian 440Wp
2 pages
Joseph A. Mica
No ratings yet
Joseph A. Mica
7 pages
Are QSM Manual Rev 08
No ratings yet
Are QSM Manual Rev 08
43 pages
Plan 2023-PhD-Training - Martin - Marañón
No ratings yet
Plan 2023-PhD-Training - Martin - Marañón
3 pages
Quotation For Diesel Type Generator
No ratings yet
Quotation For Diesel Type Generator
2 pages
Adda247 - No. 1 APP For Banking & SSC Preparation
No ratings yet
Adda247 - No. 1 APP For Banking & SSC Preparation
6 pages
COF - International Cyber Olympiad 2025
No ratings yet
COF - International Cyber Olympiad 2025
12 pages
SHC Tracker Mar 2013
No ratings yet
SHC Tracker Mar 2013
8 pages
BD130 NPN Silicon Transistor Power Linerar and Switching Applications
No ratings yet
BD130 NPN Silicon Transistor Power Linerar and Switching Applications
3 pages
Svsdvsdvsdvsdvs
No ratings yet
Svsdvsdvsdvsdvs
6 pages
LBF 0320240002 (Karawang Foods) Isi Hal 2
No ratings yet
LBF 0320240002 (Karawang Foods) Isi Hal 2
2 pages
Essential n8n Playbook
From Everand
Essential n8n Playbook
Leandro Calado
No ratings yet
How to a Developers Guide to 4k: Developer edition, #3
From Everand
How to a Developers Guide to 4k: Developer edition, #3
Xinc Cyberwizard
No ratings yet

Covid 19 Analysis and Visualization Using Plotly Express

Uploaded by

Covid 19 Analysis and Visualization Using Plotly Express

Uploaded by

# Data analysis and Manipulation

{"summary":"{\n \"name\": \"dataset1\",\n \"rows\": 209,\n

# Returns tuple of shape (Rows, columns)

# Returns size of dataframe

# Information about Dataset1

{"summary":"{\n \"name\": \"dataset2\",\n \"rows\": 35156,\n

# Returns tuple of shape (Rows, columns)

# Returns size of dataframe

# Information about Dataset2

# Columns labels of a Dataset1

Index(['Country/Region', 'Continent', 'Population', 'TotalCases',

# Drop NewCases, NewDeaths, NewRecovered columns from dataset1

dataset1.drop(['NewCases', 'NewDeaths', 'NewRecovered'],

# Select random set of values from dataset1

{"summary":"{\n \"name\": \"dataset1\",\n \"rows\": 5,\n

# Import create_table Figure Factory

from plotly.figure_factory import create_table

colorscale = [[0, '#4d004c'], [.5, '#f2e5ff'], [1, '#ffffff']]

px.bar(dataset1.head(15), x = 'Country/Region', y = 'TotalCases',

px.bar(dataset1.head(15), x = 'Country/Region', y = 'TotalCases',

px.bar(dataset1.head(15), x = 'Country/Region', y = 'TotalCases',

px.bar(dataset1.head(15), x = 'TotalTests', y = 'Country/Region',

px.bar(dataset1.head(15), x = 'TotalTests', y = 'Continent',

px.scatter(dataset1.head(30), x='Country/Region', y= 'Tests/1M pop',

px.scatter(dataset1.head(30), x='Country/Region', y= 'Tests/1M pop',

px.scatter(dataset1.head(30), x='TotalCases', y= 'TotalDeaths',

px.scatter(dataset1.head(30), x='TotalCases', y= 'TotalDeaths',

px.scatter(dataset1.head(30), x='TotalTests', y= 'TotalCases',

px.bar(df_US, x="Date", y="Confirmed", color="Confirmed", height=400)

px.bar(df_US,x="Date", y="Recovered", color="Recovered", height=400)

px.line(df_US,x="Date", y="Recovered", height=400)

px.line(df_US,x="Date", y="Deaths", height=400)

px.line(df_US,x="Date", y="Confirmed", height=400)

px.line(df_US,x="Date", y="New cases", height=400)

px.bar(df_US,x="Date", y="New cases", height=400)

px.scatter(df_US, x="Confirmed", y="Deaths", height=400)

px.bar(dataset2, x="WHO Region", y="Confirmed", color="WHO Region",

{"summary":"{\n \"name\": \"dataset3\",\n \"rows\": 12260,\n

You might also like