0% found this document useful (0 votes)

5 views · 7 pages

Exercises Part2

The document contains multiple Python scripts that perform data analysis and visualization using libraries such as pandas, matplotlib, seaborn, and statsmodels. Key analyses include time series decomposition of airline passenger data, interactive mapping of city populations, geographical plotting of world and Indian populations, and exploratory data analysis on wine quality and iris datasets. Each script demonstrates different techniques for data visualization, statistical analysis, and feature correlation.

Uploaded by

cse stud

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

5 views · 7 pages

Exercises Part2

Uploaded by

cse stud

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 7

EXE 5

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from statsmodels.tsa.seasonal import seasonal_decompose, STL
from statsmodels.graphics.tsaplots import plot_acf, plot_pacf

# EXE 5: time-series exploration of a monthly passenger series.
# The CSV is read with a 'Month' date index and a 'Passengers' value column.
url = (
    "https://raw.githubusercontent.com/jbrownlee/Datasets/master/"
    "airline-passengers.csv"
)
df = pd.read_csv(url, parse_dates=['Month'], index_col='Month')
print(df.head())

passengers = df['Passengers']

# Raw series.
plt.figure(figsize=(12, 6))
plt.plot(df.index, passengers, label="Passenger Count")
plt.title('Airline Passengers Over Time')
plt.xlabel('Year')
plt.ylabel('Number of Passengers')
plt.legend()
plt.show()

# Classical multiplicative decomposition with a 12-observation period.
result = seasonal_decompose(passengers, model='multiplicative', period=12)

fig, axes = plt.subplots(4, 1, figsize=(12, 8), sharex=True)
components = [
    (result.trend, "Trend Component"),
    (result.seasonal, "Seasonal Component"),
    (result.resid, "Residual Component"),
    (result.observed, "Observed"),
]
for axis, (series, title) in zip(axes, components):
    axis.plot(series)
    axis.set_title(title)
plt.tight_layout()
plt.show()

# 12-observation rolling statistics; the first 11 values are NaN.
rolling = passengers.rolling(window=12)
rolling_mean = rolling.mean()
rolling_std = rolling.std()
plt.figure(figsize=(12, 6))
plt.plot(passengers, label='Original')
plt.plot(rolling_mean, label='Rolling Mean (12 months)')
plt.plot(rolling_std, label='Rolling Std (12 months)')
plt.title('Rolling Mean & Standard Deviation')
plt.legend()
plt.show()

# STL decomposition. The period is passed explicitly so it matches the
# seasonal_decompose call above instead of relying on index-frequency
# inference.
stl = STL(passengers, period=12, seasonal=13)
result_stl = stl.fit()
plt.figure(figsize=(12, 6))
plt.plot(result_stl.trend, label="Trend")
plt.plot(result_stl.seasonal, label='Seasonal')
plt.plot(result_stl.resid, label='Residual')
plt.title('Seasonal-Trend decomposition using LOESS (STL)')
plt.legend()
plt.show()

# plot_acf / plot_pacf open their own figure unless an Axes is supplied, so
# pass `ax=` explicitly; a preceding plt.figure() would only leave an empty
# window behind and its figsize would be ignored.
fig, ax = plt.subplots(figsize=(12, 6))
plot_acf(passengers, lags=40, alpha=0.05, ax=ax)
ax.set_title('Autocorrelation Function (ACF)')
plt.show()

fig, ax = plt.subplots(figsize=(12, 6))
plot_pacf(passengers, lags=40, alpha=0.05, ax=ax)
ax.set_title('Partial Autocorrelation Function (PACF)')
plt.show()
EXE 6
import folium
import pandas as pd

# EXE 6: build an interactive folium map with one marker per city and save
# it to 'interactive_map.html'.
data = {
    'City': ['New York', 'San Francisco', 'Los Angeles'],
    'Population': [8175133, 884363, 3906772],
    'Latitude': [40.7128, 37.7749, 34.0522],
    'Longitude': [-74.0060, -122.4194, -118.2437],
}

df = pd.DataFrame(data)

# The map is centred on the San Francisco coordinates from the table above.
map_center = [37.7749, -122.4194]
map_obj = folium.Map(location=map_center, zoom_start=5)

for _, row in df.iterrows():
    folium.Marker(
        location=[row["Latitude"], row["Longitude"]],
        # Popup text is rendered as HTML, where "\n" collapses to a space;
        # use <br> so city and population appear on separate lines.
        popup=f"City: {row['City']}<br>Population: {row['Population']}",
        tooltip=row["City"],
    ).add_to(map_obj)

map_obj.save('interactive_map.html')
EXE 7
import geopandas as gpd
from shapely.geometry import Polygon
import matplotlib.pyplot as plt
import pandas as pd

# EXE 7: side-by-side choropleths of world and (placeholder) India population.

# NOTE(review): `gpd.datasets` was deprecated in GeoPandas 0.14 and removed in
# 1.0 -- confirm the installed version, or point read_file at a local copy of
# the Natural Earth low-resolution countries layer.
world = gpd.read_file(gpd.datasets.get_path('naturalearth_lowres'))

# A single rectangular polygon stands in for India; it is not a real state
# boundary.
india_geometry = gpd.GeoSeries(
    [Polygon([(75, 20), (80, 20), (80, 25), (75, 25)])],
    crs="EPSG:4326",
)
india = gpd.GeoDataFrame(geometry=india_geometry)

world_data = {
    # Names must match the `name` column of the Natural Earth layer exactly;
    # the United States is stored there under its full name, not 'USA'.
    'Country': ['United States of America', 'China', 'India'],
    'Population': [331002651, 1444216107, 1380004385],
}
world_df = pd.DataFrame(world_data)

india_data = {
    'State': ['Maharashtra', 'Uttar Pradesh', 'Tamil Nadu'],
    'Population': [123144223, 223897418, 77841267],
}
india_df = pd.DataFrame(india_data)

# Left merge keeps every country; those without a match get NaN population.
world = world.merge(world_df, left_on='name', right_on='Country', how='left')

# `india` has exactly one row, so only the first state's population can be
# attached to it. Selecting it explicitly makes that visible instead of
# relying on silent index alignment dropping the other two rows.
india['Population'] = india_df['Population'].iloc[0]

fig, ax = plt.subplots(1, 2, figsize=(15, 7))

world.plot(
    column='Population',
    cmap='OrRd',
    ax=ax[0],
    legend=True,
    legend_kwds={"label": "Population by Country"},
    # Draw countries with no population value in grey rather than omitting
    # them from the map.
    missing_kwds={"color": "lightgrey"},
)
ax[0].set_title('World Population')

india.plot(
    column='Population',
    cmap='OrRd',
    ax=ax[1],
    legend=True,
    legend_kwds={"label": "Population by State"},
)
ax[1].set_title('India Population')
plt.show()
EXE 8
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# EXE 8: exploratory data analysis of the wine-quality CSV.
data = pd.read_csv("winequalityN.csv")
print("First few rows of the dataset:")
print(data.head())

print("Summary statistics of the dataset:")
print(data.describe())

# One histogram per numeric column.
data.hist(bins=30, figsize=(12, 8))
plt.suptitle("Histograms of Features", y=1.02)
plt.show()

# Restrict to numeric columns before correlating: DataFrame.corr() raises on
# non-numeric columns in pandas >= 2.0, and select_dtypes works on every
# pandas version.
numeric_data = data.select_dtypes(include="number")

correlation_matrix = numeric_data.corr()
plt.figure(figsize=(10, 8))
sns.heatmap(correlation_matrix, annot=True, cmap="coolwarm", linewidths=0.5)
plt.title("Correlation Heatmap")
plt.show()

plt.figure(figsize=(12, 8))
sns.boxplot(data=numeric_data, width=0.5)
plt.xticks(rotation=45)
plt.title("Box Plots of Features")
plt.show()

plt.figure(figsize=(12, 6))
sns.histplot(data["alcohol"], kde=True)
plt.title("Alcohol Content Distribution")
plt.show()
EXE 9
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.datasets import load_iris

# EXE 9: exploratory data analysis of the scikit-learn iris dataset.
iris = load_iris()

# Feature columns plus the class label appended as a final 'target' column.
data = pd.DataFrame(
    data=np.c_[iris['data'], iris['target']],
    columns=iris['feature_names'] + ['target'],
)

print("First few rows of the dataset:")
print(data.head())

print("\nData Information:")
# DataFrame.info() prints its report itself and returns None, so wrapping it
# in print() would emit a stray "None" line.
data.info()

print("\nSummary Statistics:")
print(data.describe())

sns.set(style="whitegrid")
plt.figure(figsize=(12, 6))
plt.subplot(1, 2, 1)
sns.histplot(data['sepal length (cm)'], kde=True)
plt.title("Distribution of Sepal Length")

plt.subplot(1, 2, 2)
sns.histplot(data['sepal width (cm)'], kde=True)
plt.title("Distribution of Sepal Width")
plt.show()

# One marker style per target class.
sns.pairplot(data, hue='target', markers=["o", "s", "D"])
plt.show()

plt.figure(figsize=(10, 6))
sns.boxplot(x='target', y='petal length (cm)', data=data)
plt.title("Petal Length Boxplot by Species")
plt.show()

correlation_matrix = data.corr()
plt.figure(figsize=(8, 6))
sns.heatmap(correlation_matrix, annot=True, cmap='coolwarm')
plt.title("Correlation Heatmap")
plt.show()

# Each report line is a single string; adjacent literals are used only to
# keep source lines short.
print("\nAnalysis Report:")
print(
    "- The dataset contains three species of iris flowers: setosa, "
    "versicolor, and virginica."
)
print(
    "- The features vary in their distributions, with sepal length and "
    "sepal width showing different patterns."
)
print(
    "- The pairplot shows how the features are correlated and how they can "
    "be used to distinguish between species."
)
print(
    "- The petal length is a strong predictor for species differentiation, "
    "with setosa having the shortest petals and virginica the longest."
)
print(
    "- The correlation heatmap confirms that petal length is highly "
    "correlated with the target variable, making it an important feature "
    "for classification."
)

Claves Acceso Journals
83% (6)
Claves Acceso Journals
84 pages
PC Gr500ex 2
100% (1)
PC Gr500ex 2
880 pages
Data Visualization
No ratings yet
Data Visualization
70 pages
Code - Cap 3
No ratings yet
Code - Cap 3
5 pages
Chirayu (1) Merged Merged
No ratings yet
Chirayu (1) Merged Merged
76 pages
100 Ansministère de La Famille Adventiste
No ratings yet
100 Ansministère de La Famille Adventiste
125 pages
Introduction To Matplotlib
No ratings yet
Introduction To Matplotlib
58 pages
Visualization RST
No ratings yet
Visualization RST
33 pages
Ai&Ml Bail606 ML Lab Manual
No ratings yet
Ai&Ml Bail606 ML Lab Manual
50 pages
Regression and Eda
No ratings yet
Regression and Eda
47 pages
Pandas 3-2
No ratings yet
Pandas 3-2
27 pages
Target Value Delivery 10.17.17 Pikel
No ratings yet
Target Value Delivery 10.17.17 Pikel
93 pages
2 Trends Seasonality and Residuals Explained!-Copy1
No ratings yet
2 Trends Seasonality and Residuals Explained!-Copy1
14 pages
#1 Ok - Actual Let Exam
No ratings yet
#1 Ok - Actual Let Exam
24 pages
Plotting Directly With Matplotlib: Objectives
No ratings yet
Plotting Directly With Matplotlib: Objectives
28 pages
Data Visualization With Python
No ratings yet
Data Visualization With Python
42 pages
Five Year Dataset
No ratings yet
Five Year Dataset
15 pages
West Rox
No ratings yet
West Rox
29 pages
Presentation 1
No ratings yet
Presentation 1
30 pages
Exceed
No ratings yet
Exceed
344 pages
01 - Lesson - Visualization - Jupyter Notebook
No ratings yet
01 - Lesson - Visualization - Jupyter Notebook
18 pages
Untitled 5
No ratings yet
Untitled 5
10 pages
Lab4 Narciso
No ratings yet
Lab4 Narciso
6 pages
MLRecord
No ratings yet
MLRecord
24 pages
0.1 Exercise 26: Flights Dataset - Time Series Visualization and Analysis
No ratings yet
0.1 Exercise 26: Flights Dataset - Time Series Visualization and Analysis
8 pages
Pandas Plots
No ratings yet
Pandas Plots
14 pages
Preksha Ai Practical Class 10th - 070428
No ratings yet
Preksha Ai Practical Class 10th - 070428
13 pages
DVA Practical
No ratings yet
DVA Practical
19 pages
Sl-3 Assignment No.8
No ratings yet
Sl-3 Assignment No.8
21 pages
03 Python 08 Plot Examples
No ratings yet
03 Python 08 Plot Examples
5 pages
Crypt of Cthulhu 023 Cryptic.1984 Wolfhound
100% (4)
Crypt of Cthulhu 023 Cryptic.1984 Wolfhound
58 pages
Learn Seaborn 1674064934
No ratings yet
Learn Seaborn 1674064934
24 pages
Saikat Dey Data Science Project
No ratings yet
Saikat Dey Data Science Project
14 pages
DAVP Lab Manual
No ratings yet
DAVP Lab Manual
12 pages
Data Analyzer
No ratings yet
Data Analyzer
10 pages
Matplotlib Pandas Guide
No ratings yet
Matplotlib Pandas Guide
7 pages
ML Expt 1 Description
No ratings yet
ML Expt 1 Description
15 pages
Chart Final Class
No ratings yet
Chart Final Class
8 pages
Data Visualization Part 2
No ratings yet
Data Visualization Part 2
18 pages
CSE315:Introduction To Data Science: WEEK-8
No ratings yet
CSE315:Introduction To Data Science: WEEK-8
27 pages
Basic Plotting
No ratings yet
Basic Plotting
8 pages
Assignment 2 - Jupyter Notebook
No ratings yet
Assignment 2 - Jupyter Notebook
8 pages
Time Series Analysis Group 9
No ratings yet
Time Series Analysis Group 9
16 pages
Advanced Plot Types With Seaborn
No ratings yet
Advanced Plot Types With Seaborn
8 pages
Rain Fall
No ratings yet
Rain Fall
4 pages
Exp 2 SDK Ok
No ratings yet
Exp 2 SDK Ok
18 pages
Teaching and Learning 21st Century Skills
No ratings yet
Teaching and Learning 21st Century Skills
37 pages
Sapkas & Kollar - Lateral-Torsional Buckling of Composite Beams (2002)
No ratings yet
Sapkas & Kollar - Lateral-Torsional Buckling of Composite Beams (2002)
25 pages
Matplotlib Plots
No ratings yet
Matplotlib Plots
13 pages
Subject Matter of Book
No ratings yet
Subject Matter of Book
9 pages
Modulo 8. Data Visualization With Python
No ratings yet
Modulo 8. Data Visualization With Python
30 pages
Python Slips
No ratings yet
Python Slips
9 pages
Pandas
No ratings yet
Pandas
25 pages
Pandas Notes
No ratings yet
Pandas Notes
27 pages
Pandas Complete + Visualisation Summary of IBM Visualization
No ratings yet
Pandas Complete + Visualisation Summary of IBM Visualization
21 pages
Group Lesson Plan
83% (6)
Group Lesson Plan
7 pages
Mid Year Review Form T I III SY 2023 2024
No ratings yet
Mid Year Review Form T I III SY 2023 2024
5 pages
Cheat Python
No ratings yet
Cheat Python
8 pages
Matplotlib Pandas Guide
No ratings yet
Matplotlib Pandas Guide
9 pages
4 PythonPandas
No ratings yet
4 PythonPandas
8 pages
Data Visualization With Python
No ratings yet
Data Visualization With Python
34 pages
Area Plots, Histogram and Bar Plots in Python
No ratings yet
Area Plots, Histogram and Bar Plots in Python
9 pages
Summary: Introduction To Data Visualization Tools
No ratings yet
Summary: Introduction To Data Visualization Tools
13 pages
Multimedia Programming Interface and Data Specifications 1.0
No ratings yet
Multimedia Programming Interface and Data Specifications 1.0
97 pages
Data Science Assignment Submission
No ratings yet
Data Science Assignment Submission
12 pages
Print Print Print Print: Import As
No ratings yet
Print Print Print Print: Import As
6 pages
Main - Py Text File
No ratings yet
Main - Py Text File
5 pages
Using Python For Data Analysis - July 2018 - Slides
No ratings yet
Using Python For Data Analysis - July 2018 - Slides
43 pages
Samsung Ls15e-17e TV Service Manual
No ratings yet
Samsung Ls15e-17e TV Service Manual
74 pages
Construction of Closet, Fence, Ceiling of Cabana and Floor Tiles of Toilet
No ratings yet
Construction of Closet, Fence, Ceiling of Cabana and Floor Tiles of Toilet
6 pages
Baza Date Pitesti
No ratings yet
Baza Date Pitesti
8 pages
2.1 Exploratory Data Analysis Using Python
No ratings yet
2.1 Exploratory Data Analysis Using Python
12 pages
Sorry - Justin Bieber 1. Listen and Complete.: Portraductoras
No ratings yet
Sorry - Justin Bieber 1. Listen and Complete.: Portraductoras
2 pages
EDE Microproejct 1 by Campusify
No ratings yet
EDE Microproejct 1 by Campusify
23 pages
Revised Student Handbook 2020 2025 Guyana Campus NEW Adjusted Candice Alvarez
No ratings yet
Revised Student Handbook 2020 2025 Guyana Campus NEW Adjusted Candice Alvarez
52 pages
S5 Comp Mce Q A
No ratings yet
S5 Comp Mce Q A
17 pages
Data Visualization - New
No ratings yet
Data Visualization - New
5 pages
No Ph.D. Game Design With Three.js
From Everand
No Ph.D. Game Design With Three.js
Nikiforos Kontopoulos
No ratings yet
"The Causes and Significance of The Iranian Revolution" by Said Amir Arjomand (1985)
No ratings yet
"The Causes and Significance of The Iranian Revolution" by Said Amir Arjomand (1985)
27 pages
Syllabus For Undergraduate and Graduate Guitar Lessons - 36
No ratings yet
Syllabus For Undergraduate and Graduate Guitar Lessons - 36
9 pages
Worksheet For VIII Class in PDF Form
No ratings yet
Worksheet For VIII Class in PDF Form
5 pages
Pandas Cheat Sheet
No ratings yet
Pandas Cheat Sheet
2 pages
WEBINTEL GUIDED LAB ACTIVITY Introduction To Pandas
No ratings yet
WEBINTEL GUIDED LAB ACTIVITY Introduction To Pandas
1 page
Ldpe 2101TN47
No ratings yet
Ldpe 2101TN47
3 pages
Mala'ati Report 2025 01 22 08 23
No ratings yet
Mala'ati Report 2025 01 22 08 23
12 pages
Embedded IoT Important Questions
No ratings yet
Embedded IoT Important Questions
2 pages
Internationale Bewerbende Merkblatt Auswahlkommission English
No ratings yet
Internationale Bewerbende Merkblatt Auswahlkommission English
4 pages
Synopsis of Project
No ratings yet
Synopsis of Project
4 pages
Table of Contents - 2
No ratings yet
Table of Contents - 2
1 page
CCS (2-Marks)
No ratings yet
CCS (2-Marks)
2 pages
Circular 878
No ratings yet
Circular 878
1 page
Activity No. 2 Nervous Sys.
No ratings yet
Activity No. 2 Nervous Sys.
3 pages
5000 Words
No ratings yet
5000 Words
1 page
Eli Reiter Resume
No ratings yet
Eli Reiter Resume
1 page