0% found this document useful (0 votes)

10 views5 pages

03 Python 08 Plot Examples

The document provides a comprehensive guide on visualizing data using Python libraries such as pandas and matplotlib, focusing on life expectancy and health expenditure. It includes various plotting techniques, including line plots, bar plots, box plots, and heatmaps, while allowing user interaction for selecting countries and data types. Additionally, it covers password data analysis with visualizations for password categories and average online breaking times.

Uploaded by

dznz1999

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

10 views5 pages

03 Python 08 Plot Examples

Uploaded by

dznz1999

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 5

Visualization

Python
pandas and matplotlib
line plot
multiple line plots
barplot
boxplot
heatmap

Life Expectancy and Health Expenditure

# CSV with life expectancy and health expenditure values per country and year.
FDATA = "./files/matplot.life-expectancy-vs-health-expenditure.csv"
# Menu option -> [menu label, DataFrame column name, y-axis label].
OPTCHART = {
    1: ['Life Expectancy', 'LifeExpectancy', 'Number of years'],
    2: ['Health Expenditure', 'HealthExpenditure', 'Dollars/Capita Year'],
}
# Line colour for each data column.
COLORS = {"LifeExpectancy": "#16acd8", "HealthExpenditure": "#4e16d8"}
# Column renames applied to the loaded data.
COLRENAME = {'Entity': 'Country'}


def menu():
    """Return the prompt used to choose which data series to plot.

    The prompt has one ``"<key>: <label>"`` line per OPTCHART entry,
    followed by ``"Your choice: "`` with no trailing newline.
    """
    options = "".join(f"{key}: {val[0]}\n" for key, val in OPTCHART.items())
    return options + "Your choice: "


print(menu())

# Load the dataset and apply the column renames (Entity -> Country).
df = pd.read_csv(FDATA)
df = df.rename(columns=COLRENAME)

# Country names present in the data, used to validate the user's input.
clist = df.Country.unique()

# Select one country for plotting; keep asking until it matches the data.
country = input("Country: ")
while country not in clist:
    country = input("Country: ")

# Select which data series to plot. A non-numeric answer is handled like any
# other invalid choice (ask again) instead of raising ValueError.
opt = None
while opt not in OPTCHART:
    try:
        opt = int(input(menu()))
    except ValueError:
        opt = None
colname = OPTCHART[opt][1]

# Colour mapping restricted to the selected column.
selcol = {colname: COLORS[colname]}

# Rows of the chosen country that have a value in the selected column.
dfsel = df[(df.Country == country) & df[colname].notna()][['Year', colname]]
#print(dfsel)

Q1 plot one data series for a selected country

pandas plot

# Single series drawn through the pandas ``plot.line`` accessor, legend hidden.
series_label = OPTCHART[opt][0]
unit_label = OPTCHART[opt][2]
ax = dfsel.plot.line(x='Year', legend=False, color=selcol)
plt.xlabel('Year')
plt.ylabel(unit_label)
plt.title("pandas.plot.line: " + series_label + "\n" + country.title())
#plt.show()

pandas plot - uses line

# Same chart through the generic DataFrame.plot entry point.
plot_title = "pandas.plot: " + OPTCHART[opt][0] + "\n" + country.title()
ax = dfsel.plot(x='Year', legend=False, color=selcol)
plt.xlabel('Year')
plt.ylabel(OPTCHART[opt][2])
plt.title(plot_title)
#plt.show()

matplotlib

# Same single-series chart, drawn directly with matplotlib on an explicit axes.
fig, ax = plt.subplots()
# The label given here is the text the legend shows for this line.
ax.plot(dfsel['Year'], dfsel[colname], label=OPTCHART[opt][0])
ax.set_xlabel('Year')
ax.set_ylabel(OPTCHART[opt][2])
ax.set_title("matplotlib: " + OPTCHART[opt][0] + "\n" + country.title())
ax.legend()  # show the legend with the label set above
#plt.show()

Q2 plot both data

## Two different Y axes

### separate charts
# All rows of the selected country. Missing values are dropped per series, so
# neither curve depends on which single series was chosen for the Q1 plots.
dfcountry = df[df.Country == country]
life = dfcountry[['Year', 'LifeExpectancy']].dropna()
health = dfcountry[['Year', 'HealthExpenditure']].dropna()

# Two stacked charts, one per series.
fig, axes = plt.subplots(2, 1, figsize=(8, 10))
axes[0].plot(life.Year, life.LifeExpectancy)
axes[1].plot(health.Year, health.HealthExpenditure)
plt.show()

# One chart with a shared x axis and a separate y axis for each series.
fig, ax1 = plt.subplots(figsize=(8, 8))
ax2 = ax1.twinx()
ax1.plot(life.Year, life.LifeExpectancy, color=COLORS['LifeExpectancy'])
ax2.plot(health.Year, health.HealthExpenditure,
         color=COLORS['HealthExpenditure'])
ax1.set_xlabel("Year")
ax1.set_ylabel(OPTCHART[1][2])
ax2.set_ylabel(OPTCHART[2][2])
plt.show()

Q3 plot several selected countries

create a table with one column per country and plot it in a single chart

#TODO : ask the user a set of countries

countries = ['Italy', 'France']
# Wide table: one row per year, one column per country, values taken from the
# selected column. Filtering, column selection and pivot form one expression;
# the parentheses keep it valid across several lines.
has_data = df.Country.isin(countries) & df[colname].notna()
dftab = (
    df.loc[has_data, ['Country', 'Year', colname]]
    .pivot(index='Year', columns='Country', values=colname)
)
ax = dftab.plot(kind='line')
plt.ylabel(OPTCHART[opt][2])
plt.title("pandas.plot - single chart: " + OPTCHART[opt][0])
plt.show()

one chart per country

# Plots the dftab table again; subplots=True draws one axes per column.
ax = dftab.plot(kind='line', subplots=True,
                title="pandas.plot - multiple chart: " + OPTCHART[opt][0])
# plt.ylabel() only affects the current (last) subplot, so label each axes.
for subplot in ax:
    subplot.set_ylabel(OPTCHART[opt][2])
plt.show()

matplotlib

# single chart
fig, axes = plt.subplots()
# A dedicated loop name keeps the earlier `country` selection intact.
for name in countries:
    plt.plot(dftab.index, dftab[name], label=name)  # one line per country
plt.xlabel('Year')
plt.ylabel(OPTCHART[opt][2])
plt.title("matplotlib - single chart: " + OPTCHART[opt][0])
plt.legend(title='Country')
plt.show()

one chart per country

# One colour per subplot. It has its own name so that the COLORS dict
# (column name -> colour) is not replaced by a list.
COUNTRY_COLORS = ['#00202e', '#003f5c', '#2c4875', '#8a508f', '#bc5090', '#ff6361',
                  '#ff8531', '#ffa600']

# Count the table's columns rather than the requested names, so the number of
# subplots always matches the number of series drawn in the loop.
ncountries = len(dftab.columns)
# squeeze=False always returns a 2-D array of axes, even for a single row.
fig, axes = plt.subplots(ncountries, 1, figsize=(8, 6 * ncountries), squeeze=False)
for i, name in enumerate(dftab.columns):
    axis = axes[i, 0]
    # Axes.plot() has no `legend` keyword; not calling legend() leaves it off.
    # The modulo reuses colours when there are more series than colours.
    axis.plot(dftab.index, dftab[name], color=COUNTRY_COLORS[i % len(COUNTRY_COLORS)])
    # Title names the plotted series rather than always "Life Expectancy".
    axis.set_title(f'{name} {OPTCHART[opt][0]} Over Years')
    axis.set_xlabel('Year')
    axis.set_ylabel(OPTCHART[opt][2])
plt.tight_layout()
plt.show()

Q4 boxplot

selcountries = ['France', 'Germany', 'Italy']
# Rows after 2000 for the selected countries, limited to the listed columns.
dfcs = df.loc[
    (df['Year'] > 2000) & df['Country'].isin(selcountries),
    ['Country', 'Year', 'LifeExpectancy', 'HealthExpenditure'],
]
# subplots=False puts the boxes of all countries on one shared axes.
ax = dfcs.groupby('Country')[['LifeExpectancy']].boxplot(subplots=False)
# groupby orders its groups by sorted key; take the tick labels from the data
# in that same order instead of relying on how selcountries is written.
ax.set_xticklabels(sorted(dfcs['Country'].unique()))

Passwords

FDATA = "./files/passwords.txt.csv"
FCAT = "./files/passwords.cat.csv"

# Number of hours in one of each time unit (a month counts as 30 days,
# a year as 365 days).
TIMECONV = {
    'seconds': 1/3600,
    'minutes': 1/60,
    'hours': 1,
    'days': 24,
    'weeks': 168,
    'months': 720,
    'years': 8760,
}

dfp = pd.read_csv(FDATA)
dfc = pd.read_csv(FCAT)

# `value` converted to hours through its `time_unit`. Kept as float: an int
# cast raises on rows where value or unit is missing (NaN) and truncates every
# sub-hour time to 0, which would distort the per-category mean below.
dfp['online_hours'] = dfp['value'] * dfp['time_unit'].map(TIMECONV)

# number of passwords per category and average online breaking time
dfg = (
    dfp.groupby('catid')
    .agg(count=('online_hours', 'size'), online_hours=('online_hours', 'mean'))
    .reset_index()
)
# Right join keeps every row of the category table, matched on catid == id.
dfres = dfg.merge(dfc, how='right', left_on='catid', right_on='id')

Q1 pandas number of passwords per category, showing the name

# Bar chart of the aggregated table: category on x, 'count' as bar height.
dfres.plot.bar(x='category', y='count')
plt.ylabel('number of passwords')
plt.title('Plot on grouped - flat data')
plt.show()

pandas: let it compute the counts

# Join the password rows with the category table (right join on catid == id).
dfpc = dfp.merge(dfc, how='right', left_on='catid', right_on='id')

# Let pandas do the counting: value_counts() tallies the rows per category.
category_counts = dfpc[['category']].value_counts()
category_counts.plot(kind='bar', xlabel='Category', ylabel='Count', rot=90)
plt.title('Plot value count')
plt.show()

matplotlib

# Bar chart of the 'online_hours' column per category, drawn with matplotlib.
fig, ax = plt.subplots()
bar_style = dict(width=1, edgecolor="white", linewidth=0.7)
ax.bar(dfres['category'], dfres['online_hours'], **bar_style)
# x range runs from -1 to the number of distinct categories.
ncat = dfres['category'].nunique()
ax.set_xlim(-1, ncat)
plt.xticks(rotation=90)
plt.title('Matplot on grouped')
plt.show()

Q2 show average times

# Box plot of online_hours per category, using only rows below 10000 hours.
below_limit = dfpc[dfpc['online_hours'] < 10000]
below_limit.boxplot(column=['online_hours'], by='category',
                    grid=False, color='black', rot=90)

histogram

# Histogram of the 'strength' column.
dfpc[['strength']].plot.hist()

Weed Identification Guide
No ratings yet
Weed Identification Guide
1 page
Exercises Part2
No ratings yet
Exercises Part2
7 pages
Data Visualization - New
No ratings yet
Data Visualization - New
5 pages
Intermediate Python
No ratings yet
Intermediate Python
22 pages
Intermediate Python
No ratings yet
Intermediate Python
22 pages
Final Group Project
No ratings yet
Final Group Project
26 pages
Final Coding
No ratings yet
Final Coding
9 pages
How To Open Without Moudlue
No ratings yet
How To Open Without Moudlue
9 pages
Intermediate - F (Autoguardado)
No ratings yet
Intermediate - F (Autoguardado)
70 pages
Matplotlib Pandas Guide
No ratings yet
Matplotlib Pandas Guide
7 pages
Mastering Data Visualization Techniques
No ratings yet
Mastering Data Visualization Techniques
159 pages
World Happiness Report
No ratings yet
World Happiness Report
7 pages
Data Science Assignment Submission
No ratings yet
Data Science Assignment Submission
12 pages
Histogramlar
No ratings yet
Histogramlar
18 pages
Mastering Data Visualization Techniques 1728896857
No ratings yet
Mastering Data Visualization Techniques 1728896857
85 pages
Mastering Data Visualization Techniques (Part 1)
No ratings yet
Mastering Data Visualization Techniques (Part 1)
20 pages
Modulo 8. Data Visualization With Python
No ratings yet
Modulo 8. Data Visualization With Python
30 pages
Can We Really Live Longer - A Machine Learning Study - by Nicolasdealba - Medium
No ratings yet
Can We Really Live Longer - A Machine Learning Study - by Nicolasdealba - Medium
34 pages
Data Visualization With Python
No ratings yet
Data Visualization With Python
42 pages
Matplotlib
No ratings yet
Matplotlib
5 pages
Basic Line Plot Using Matplotlib
No ratings yet
Basic Line Plot Using Matplotlib
9 pages
Data Visualization With Python
No ratings yet
Data Visualization With Python
34 pages
DVA Practical
No ratings yet
DVA Practical
19 pages
Line Plot (1) : Datacamp Courses-Jhu-Genomics-Demo
No ratings yet
Line Plot (1) : Datacamp Courses-Jhu-Genomics-Demo
22 pages
Pandas Cheat Sheet
No ratings yet
Pandas Cheat Sheet
2 pages
LAB4 EDA Desc Analysis
No ratings yet
LAB4 EDA Desc Analysis
26 pages
Intro To Pandas World Happiness
No ratings yet
Intro To Pandas World Happiness
20 pages
Ilovepdf Merged
No ratings yet
Ilovepdf Merged
89 pages
DAVP Lab Manual
No ratings yet
DAVP Lab Manual
12 pages
Fds Slips
No ratings yet
Fds Slips
6 pages
Five Year Dataset
No ratings yet
Five Year Dataset
15 pages
Pip
No ratings yet
Pip
3 pages
Data Visualization
No ratings yet
Data Visualization
70 pages
Country - Data (Record) - Jupyter Notebook
No ratings yet
Country - Data (Record) - Jupyter Notebook
5 pages
Aim: Objective
No ratings yet
Aim: Objective
7 pages
Matplotlib Pandas Guide
No ratings yet
Matplotlib Pandas Guide
9 pages
Data Visualization - 1 by Matplot Lib
No ratings yet
Data Visualization - 1 by Matplot Lib
19 pages
Data Visualization
No ratings yet
Data Visualization
48 pages
Python Slips
No ratings yet
Python Slips
9 pages
health_risk_prediction
No ratings yet
health_risk_prediction
80 pages
Code (Misbha & Nishi)
No ratings yet
Code (Misbha & Nishi)
10 pages
Healthcare Insurance Prediction Main
No ratings yet
Healthcare Insurance Prediction Main
74 pages
Basic Plotting
No ratings yet
Basic Plotting
8 pages
Assignment 6
No ratings yet
Assignment 6
5 pages
Chart Final Class
No ratings yet
Chart Final Class
8 pages
Experiment No 9
No ratings yet
Experiment No 9
13 pages
Terror Casualty Attack
No ratings yet
Terror Casualty Attack
6 pages
Code - Cap 3
No ratings yet
Code - Cap 3
5 pages
Datascience 2 PDF
No ratings yet
Datascience 2 PDF
24 pages
Matplotlib
No ratings yet
Matplotlib
15 pages
Assignment2 DMS672
No ratings yet
Assignment2 DMS672
15 pages
Course3 Notes
No ratings yet
Course3 Notes
44 pages
DV0101EN-2-2-1-Area-Plots-Histograms-and-Bar-Charts-py-v2.0: 1 Exploring Datasets With Pandas and Matplotlib
No ratings yet
DV0101EN-2-2-1-Area-Plots-Histograms-and-Bar-Charts-py-v2.0: 1 Exploring Datasets With Pandas and Matplotlib
29 pages
Program 2 Hierarchical Cluestring
No ratings yet
Program 2 Hierarchical Cluestring
5 pages
20 June BA Class
No ratings yet
20 June BA Class
17 pages
Data Visualization
No ratings yet
Data Visualization
159 pages
Data Analytics7
No ratings yet
Data Analytics7
5 pages
Regression and Eda
No ratings yet
Regression and Eda
47 pages
CP CH3 Ims555
No ratings yet
CP CH3 Ims555
8 pages
Quantum Field Theory
No ratings yet
Quantum Field Theory
26 pages
Text
No ratings yet
Text
15 pages
BOQ 20m Depth HDW
No ratings yet
BOQ 20m Depth HDW
1 page
R D Sin: Engineering Heat and Mass Transfer
No ratings yet
R D Sin: Engineering Heat and Mass Transfer
4 pages
Evaluation of Rock-Mass Permeability Tensor and Prediction of Tunnel Inflows by
No ratings yet
Evaluation of Rock-Mass Permeability Tensor and Prediction of Tunnel Inflows by
11 pages
347 Syllabus
No ratings yet
347 Syllabus
2 pages
Binding Effect of Cassava Starches On The Compression and Mechanical Properties of Ibuprofen Tablets
No ratings yet
Binding Effect of Cassava Starches On The Compression and Mechanical Properties of Ibuprofen Tablets
7 pages
Pattern Recognition Unit 1,2
No ratings yet
Pattern Recognition Unit 1,2
82 pages
IIT Video Lectures On Analog VLSI Design (Not Available in NPTEL)
No ratings yet
IIT Video Lectures On Analog VLSI Design (Not Available in NPTEL)
2 pages
CH 3 2020
No ratings yet
CH 3 2020
62 pages
Bushings IS 2099
No ratings yet
Bushings IS 2099
38 pages
Electronic Siren: October 3, 2013 by Engineeering Projects 0 Comments
No ratings yet
Electronic Siren: October 3, 2013 by Engineeering Projects 0 Comments
5 pages
Decreasing Wavelength Increasing Increasing Frequency Decreasing Increasing Energy Decreasing
No ratings yet
Decreasing Wavelength Increasing Increasing Frequency Decreasing Increasing Energy Decreasing
4 pages
Circular Motion 1
0% (1)
Circular Motion 1
1 page
Cape Chemistry 2012 U2 p2 Ms
100% (1)
Cape Chemistry 2012 U2 p2 Ms
9 pages
Ansys Motor-CAD 2023 R1 - 新功能介绍
No ratings yet
Ansys Motor-CAD 2023 R1 - 新功能介绍
35 pages
2619 1 5218 1 10 20160408 PDF
No ratings yet
2619 1 5218 1 10 20160408 PDF
14 pages
Statistical Treatment
No ratings yet
Statistical Treatment
7 pages
It Assignment - 1: Analog Signal Digital Signal
No ratings yet
It Assignment - 1: Analog Signal Digital Signal
6 pages
Math
No ratings yet
Math
2 pages
MC0082 - Theory of Computer Science
No ratings yet
MC0082 - Theory of Computer Science
235 pages
Class Ix Chemistry Notes Session 1 L1
No ratings yet
Class Ix Chemistry Notes Session 1 L1
3 pages
Level III - Ata 38 Water - Waste
No ratings yet
Level III - Ata 38 Water - Waste
40 pages
CSE 4204 FYDP Audit and Moderation Form Fall 2024
No ratings yet
CSE 4204 FYDP Audit and Moderation Form Fall 2024
6 pages
Welcome To Data Science Online Bootcamp
No ratings yet
Welcome To Data Science Online Bootcamp
18 pages
Bearings Constructions and Scale Drawings nXcM959JKxCN9hdp
No ratings yet
Bearings Constructions and Scale Drawings nXcM959JKxCN9hdp
18 pages
Pharmakokinetics E03 (Medlive by DR Priyanka)
No ratings yet
Pharmakokinetics E03 (Medlive by DR Priyanka)
371 pages

03 Python 08 Plot Examples

Uploaded by

03 Python 08 Plot Examples

Uploaded by

Visualization

Life Expectancy and Health Expenditure

# select one Country for plotting

# select data for chart

Q1 plot one information for a selected country

# one line, no legend

pandas plot - uses line

ax = dfsel.plot(x='Year', legend=False, color=selcol)

Q2 plot both data

## Two different Y axes

fig, ax1 = plt.subplots(figsize=(8, 8))

Q3 plot several selected countries

#TODO : ask the user a set of countries

one chart per country

#dfsel = df[(df.Country.isin(countries)) & (~df[colname].isna())]

one chart per country

COLORS = ['#00202e', '#003f5c', '#2c4875', '#8a508f', '#bc5090', '#ff6361',

TIMECONV = {'seconds': 1/3600,

# number of passwords per category and average online breaking time

Q1 pandas number of passwords per category, showing the name

dfres.plot(kind='bar', x='category', y='count')

pandas let it compute

dfpc = dfp.merge(dfc, how='right', left_on='catid', right_on='id')

Q2 show average times

dfpc[dfpc.online_hours < 10000].boxplot(column=['online_hours'], by='category',

You might also like