#EXP2 EDA ON 2 VARIABLE DATASET

This document outlines an exploratory data analysis (EDA) of the Iris dataset, focusing on the relationship between sepal length and petal length using linear regression. It includes visualizations such as boxplots and a correlation heatmap, and compares regression models fitted with and without a bias (intercept) term. It also demonstrates classification of a synthetic dataset using a perceptron with and without bias, reporting the accuracy of both models.

Uploaded by

22b137
Copyright
© © All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
3 views4 pages

#Exp2 Eda On 2 Variable Dataset

The document outlines an exploratory data analysis (EDA) on the Iris dataset, focusing on the relationship between sepal length and petal length using linear regression. It includes visualizations such as boxplots and heatmaps, and compares regression models with and without bias. Additionally, it demonstrates the classification of a synthetic dataset using a perceptron model with and without bias, reporting the accuracy for both models.

Uploaded by

22b137
Copyright
© © All Rights Reserved
We take content rights seriously. If you suspect this is your content, claim it here.
Available Formats
Download as PDF, TXT or read online on Scribd
You are on page 1/ 4

#EXP2 EDA ON 2 VARIABLE DATASET

import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression
from sklearn.model_selection import train_test_split
from sklearn.metrics import mean_squared_error, r2_score

df = sns.load_dataset("iris")

# ---------- 1. Check Categorical Variable (Species) ----------


print("\nUnique Species in Dataset:", df['species'].unique())

# Boxplot: Species vs Sepal Length


plt.figure(figsize=(10, 5))
sns.boxplot(x="species", y="sepal_length", data=df, palette="coolwarm")
plt.title("Sepal Length Distribution Across Species")
plt.show()
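
The boxplot can be complemented with per-species summary statistics; the snippet below is an optional sketch, not part of the original script, and uses the same df loaded above.

# Optional: numeric summary of sepal length per species (complements the boxplot)
print(df.groupby('species')['sepal_length'].describe())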

# ---------- 2. Correlation Heatmap ----------


plt.figure(figsize=(8, 6))
sns.heatmap(df.corr(numeric_only=True), annot=True, cmap="coolwarm", fmt=".2f")
plt.title("Feature Correlation Heatmap")
plt.show()
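
Before fitting the regression below, it helps to confirm that the chosen pair of variables is strongly correlated. This is a minimal sketch that simply reads off the same value shown in the heatmap.

# Optional check: correlation between the two variables used in the regression below
corr = df['sepal_length'].corr(df['petal_length'])
print(f"Correlation (sepal_length vs petal_length): {corr:.2f}")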

# ---------- 3. Simple Linear Regression ----------


X = df[['sepal_length']] # Independent variable
y = df['petal_length'] # Dependent variable
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Train the model


model = LinearRegression()
model.fit(X_train, y_train)

# Predictions
y_pred = model.predict(X_test)

# Model evaluation
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

# Print results
print(f"\nModel Coefficient: {model.coef_[0]:.2f}")
print(f"Model Intercept: {model.intercept_:.2f}")
print(f"Mean Squared Error: {mse:.2f}")
print(f"R2 Score: {r2:.2f}")

plt.figure(figsize=(8, 6))
sns.scatterplot(x=X_test['sepal_length'], y=y_test, hue=df.loc[X_test.index, 'species'],
                palette="viridis", legend=False)
sns.lineplot(x=X_test['sepal_length'], y=y_pred, color='red', label='Regression Line')

plt.xlabel("Sepal Length")
plt.ylabel("Petal Length")
plt.title("Linear Regression: Sepal Length vs Petal Length")
plt.legend()

plt.show()
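
A small usage example (not in the original script) shows how the fitted model can be applied to a new measurement; the 6.0 cm sepal length below is purely illustrative.

# Example: predict petal length for a hypothetical flower with a 6.0 cm sepal
new_flower = pd.DataFrame({'sepal_length': [6.0]})
print(f"Predicted petal length for sepal length 6.0 cm: {model.predict(new_flower)[0]:.2f} cm")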

#REGRESSION MODEL WITH AND WITHOUT BIAS


import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

# Load dataset
data = sns.load_dataset('iris')

# Feature matrix X (all four measurements) and petal length as target y;
# only the sepal_length column of X is actually used by the models below
X = data[['sepal_length', 'sepal_width', 'petal_length', 'petal_width']].values
y = data['petal_length'].values
species = data['species']

# Split into train/test


X_train, X_test, y_train, y_test, species_train, species_test = train_test_split(
    X, y, species, test_size=0.2, random_state=42
)

# ----------- Model WITH Bias (fit_intercept=True) -----------


model1 = LinearRegression()
model1.fit(X_train[:, 0:1], y_train) # Use only sepal_length
pred1 = model1.predict(X_test[:, 0:1])
mse1 = mean_squared_error(y_test, pred1)
print("MSE with Bias:", round(mse1, 2))
# ----------- Model WITHOUT Bias (fit_intercept=False) -----------
model2 = LinearRegression(fit_intercept=False)
model2.fit(X_train[:, 0:1], y_train)
pred2 = model2.predict(X_test[:, 0:1])
mse2 = mean_squared_error(y_test, pred2)
print("MSE without Bias:", round(mse2, 2))

# ----------- Comparison Plot -----------


plt.figure(figsize=(12, 5))

# Plot 1: With Bias


plt.subplot(1, 2, 1)
sns.scatterplot(x=X_test[:, 0], y=y_test, hue=species_test, palette='viridis', alpha=0.7)
plt.plot(X_test[:, 0], pred1, color='red', label='With Bias')
plt.title('With Bias')
plt.xlabel('Sepal Length')
plt.ylabel('Petal Length')
plt.legend()

# Plot 2: Without Bias


plt.subplot(1, 2, 2)
sns.scatterplot(x=X_test[:, 0], y=y_test, hue=species_test, palette='viridis', alpha=0.7)
plt.plot(X_test[:, 0], pred2, color='blue', label='Without Bias')
plt.title('Without Bias')
plt.xlabel('Sepal Length')
plt.ylabel('Petal Length')
plt.legend()

plt.tight_layout()
plt.show()

#EXP 4
Classification of a dataset using a perceptron with and without bias (a synthetic dataset generated with make_classification stands in for a UCI repository dataset here).
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.linear_model import Perceptron
from sklearn.metrics import accuracy_score
from sklearn.datasets import make_classification

# Generate a synthetic dataset


X, y = make_classification(n_samples=1000, n_features=20, n_classes=2, random_state=0)
# Splitting the dataset into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=0)

# Fitting a perceptron model without bias


model_no_bias = Perceptron(fit_intercept=False)
model_no_bias.fit(X_train, y_train)
y_pred_no_bias = model_no_bias.predict(X_test)
accuracy_no_bias = accuracy_score(y_test, y_pred_no_bias)
print("Accuracy of perceptron without bias:", accuracy_no_bias)

# Fitting a perceptron model with bias


model_with_bias = Perceptron(fit_intercept=True)
model_with_bias.fit(X_train, y_train)
y_pred_with_bias = model_with_bias.predict(X_test)
accuracy_with_bias = accuracy_score(y_test, y_pred_with_bias)
print("Accuracy of perceptron with bias:", accuracy_with_bias)
