0% found this document useful (0 votes)

36 views4 pages

Lab7 Hameed 211086

Uploaded by

Abdul Moaid

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

36 views4 pages

Lab7 Hameed 211086

Uploaded by

Abdul Moaid

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

3/19/24, 11:44 PM lab7.ipynb - Colaboratory

Name Hameed Ullah

211086-A

AI Lab TASK 7

# Importing necessary libraries

from sklearn.tree import DecisionTreeClassifier
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from matplotlib.colors import ListedColormap

# Load the dataset
#
# NOTE(review): assumes the standard NSL-KDD layout (no header row; 41 feature
# columns, then the attack label, then a difficulty score) -- confirm against
# the actual file. Giving read_csv only three names for a wider file makes
# pandas use the leading columns as the index and attach the names to the LAST
# three columns, so the wanted columns are selected by position instead:
# 0 = duration, 1 = protocol_type, 41 = attack label.

file_path = "/content/drive/MyDrive/Colab Notebooks/KDDTrain+.txt"
column_names = ["duration", "protocol_type", "attack_type"]
data = pd.read_csv(file_path, header=None, usecols=[0, 1, 41], names=column_names)

# Preprocessing
selected_columns = ["duration", "protocol_type", "attack_type"]
preprocessed_data = data[selected_columns]

# Check for missing values

print(preprocessed_data.isnull().sum())

# Splitting the dataset into features (x) and target (y)

x = preprocessed_data.drop(columns=["attack_type"])
y = preprocessed_data["attack_type"]

# Splitting the dataset into training and test sets

x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.25, random_state=0)

# Check data types

print(x_train.dtypes)

# Convert 'protocol_type' to numeric using label encoding.
# assign() builds a new frame instead of writing a column into the frame
# returned by train_test_split.

label_encoder = LabelEncoder()
x_train = x_train.assign(
    protocol_type_encoded=label_encoder.fit_transform(x_train['protocol_type'])
)

# Extract x and y variables for visualization

x_set = x_train[['duration', 'protocol_type_encoded']].values
y_set = y_train.values

# Check data types after label encoding

print(x_set.dtype)
print(np.isnan(x_set).sum())

# Fitting Decision Tree classifier to the training set

classifier = DecisionTreeClassifier(criterion='entropy', random_state=0)
classifier.fit(x_set, y_set)

# One colour per class. The classifier predicts the raw labels, which may be
# strings, so they are mapped to 0..n-1 before being handed to contourf.
class_labels = np.unique(y_set)
n_classes = len(class_labels)
target_encoder = LabelEncoder().fit(class_labels)
palette = ListedColormap(plt.get_cmap('nipy_spectral')(np.linspace(0, 1, n_classes)))

# Meshgrid creation
x1_min, x1_max = x_set[:, 0].min() - 1, x_set[:, 0].max() + 1
x2_min, x2_max = x_set[:, 1].min() - 1, x_set[:, 1].max() + 1
x1, x2 = np.meshgrid(np.arange(start=x1_min, stop=x1_max, step=1),
                     np.arange(start=x2_min, stop=x2_max, step=1))

# Plotting the decision boundary

grid_points = np.column_stack((x1.ravel(), x2.ravel()))
grid_classes = target_encoder.transform(classifier.predict(grid_points)).reshape(x1.shape)

plt.figure(figsize=(10, 6))
# Level edges at k - 0.5 give every class index its own filled band.
plt.contourf(x1, x2, grid_classes,
             levels=np.arange(n_classes + 1) - 0.5,
             alpha=0.75, cmap=palette)

# Plotting the data points

for i, j in enumerate(class_labels):
    # color= (not c=) because a single RGBA tuple is passed for all points.
    plt.scatter(x_set[y_set == j, 0], x_set[y_set == j, 1],
                color=palette(i), label=j)

# Setting plot labels and legend

plt.xlim(x1.min(), x1.max())
plt.ylim(x2.min(), x2.max())
plt.title('Decision Tree Algorithm (Training set)')
plt.xlabel('duration')
plt.ylabel('protocol_type_encoded')
plt.legend()

# Show plot
plt.show()

duration 0
protocol_type 0
attack_type 0
dtype: int64
duration float64
protocol_type object
dtype: object
float64
0
<ipython-input-25-49c950067830>:61: UserWarning: *c* argument looks like a single numeric RGB or RGBA sequence, wh
plt.scatter(x_set[y_set == j, 0], x_set[y_set == j, 1],

# Importing necessary libraries
# (repeated here so this cell does not depend on an earlier cell having run)

from sklearn.tree import DecisionTreeClassifier
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from matplotlib.colors import ListedColormap

# Load the dataset
#
# NOTE(review): assumes the standard NSL-KDD layout (no header row; 41 feature
# columns, then the attack label, then a difficulty score) -- confirm against
# the actual file. Giving read_csv only three names for a wider file makes
# pandas use the leading columns as the index and attach the names to the LAST
# three columns, so the wanted columns are selected by position instead:
# 0 = duration, 1 = protocol_type, 41 = attack label.

file_path = "/content/drive/MyDrive/Colab Notebooks/KDDTest+.txt"
column_names = ["duration", "protocol_type", "attack_type"]
data = pd.read_csv(file_path, header=None, usecols=[0, 1, 41], names=column_names)

# Preprocessing
selected_columns = ["duration", "protocol_type", "attack_type"]
preprocessed_data = data[selected_columns]

# Check for missing values

print(preprocessed_data.isnull().sum())

# Splitting the dataset into features (x) and target (y)

x = preprocessed_data.drop(columns=["attack_type"])
y = preprocessed_data["attack_type"]

# Splitting the dataset into training and test sets
#
# NOTE(review): this cell fits a new tree on a 75% split of the test file and
# plots that same split; it does not evaluate a model trained on KDDTrain+.
# Left as-is -- confirm whether that is the intended "testing set" figure.

x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.25, random_state=0)

# Check data types

print(x_train.dtypes)

# Convert 'protocol_type' to numeric using label encoding.
# assign() builds a new frame instead of writing a column into the frame
# returned by train_test_split.

label_encoder = LabelEncoder()
x_train = x_train.assign(
    protocol_type_encoded=label_encoder.fit_transform(x_train['protocol_type'])
)

# Extract x and y variables for visualization

x_set = x_train[['duration', 'protocol_type_encoded']].values
y_set = y_train.values

# Check data types after label encoding

print(x_set.dtype)
print(np.isnan(x_set).sum())

# Fitting Decision Tree classifier to the training set

classifier = DecisionTreeClassifier(criterion='entropy', random_state=0)
classifier.fit(x_set, y_set)

# One colour per class. The classifier predicts the raw labels, which may be
# strings, so they are mapped to 0..n-1 before being handed to contourf.
class_labels = np.unique(y_set)
n_classes = len(class_labels)
target_encoder = LabelEncoder().fit(class_labels)
palette = ListedColormap(plt.get_cmap('nipy_spectral')(np.linspace(0, 1, n_classes)))

# Meshgrid creation -- built from this cell's own data so the grid covers the
# plotted points rather than whatever range an earlier cell left in x1/x2.
x1_min, x1_max = x_set[:, 0].min() - 1, x_set[:, 0].max() + 1
x2_min, x2_max = x_set[:, 1].min() - 1, x_set[:, 1].max() + 1
x1, x2 = np.meshgrid(np.arange(start=x1_min, stop=x1_max, step=1),
                     np.arange(start=x2_min, stop=x2_max, step=1))

# Plotting the decision boundary

grid_points = np.column_stack((x1.ravel(), x2.ravel()))
grid_classes = target_encoder.transform(classifier.predict(grid_points)).reshape(x1.shape)

plt.figure(figsize=(10, 6))
# Level edges at k - 0.5 give every class index its own filled band.
plt.contourf(x1, x2, grid_classes,
             levels=np.arange(n_classes + 1) - 0.5,
             alpha=0.75, cmap=palette)

# Plotting the data points

for i, j in enumerate(class_labels):
    # color= (not c=) because a single RGBA tuple is passed for all points.
    plt.scatter(x_set[y_set == j, 0], x_set[y_set == j, 1],
                color=palette(i), label=j)

# Setting plot labels and legend

plt.xlim(x1.min(), x1.max())
plt.ylim(x2.min(), x2.max())
plt.title('Decision Tree Algorithm (testing set)')
plt.xlabel('duration')
plt.ylabel('protocol_type_encoded')
plt.legend()

# Show plot
plt.show()

https://colab.research.google.com/drive/1QkVj8I_GkxQLWkwssl4-iFD1oQmMIZ9Y#scrollTo=51BptnM6_KHL&printMode=true 3/4
3/19/24, 11:44 PM lab7.ipynb - Colaboratory

duration 0
protocol_type 0
attack_type 0
dtype: int64
duration float64
protocol_type object
dtype: object
float64
0
<ipython-input-26-72b12f93fe69>:61: UserWarning: *c* argument looks like a single numeric RGB or RGBA sequence, wh
plt.scatter(x_set[y_set == j, 0], x_set[y_set == j, 1],

https://colab.research.google.com/drive/1QkVj8I_GkxQLWkwssl4-iFD1oQmMIZ9Y#scrollTo=51BptnM6_KHL&printMode=true 4/4

Vts Description Guide Vdep Third Party Solutions
100% (1)
Vts Description Guide Vdep Third Party Solutions
32 pages
Machine Learning Algorithms PDF
100% (1)
Machine Learning Algorithms PDF
148 pages
Pattern Recognition Lab
No ratings yet
Pattern Recognition Lab
24 pages
CS178 Homework #1: Problem 0: Getting Connected
No ratings yet
CS178 Homework #1: Problem 0: Getting Connected
4 pages
About ... Moly-Cop Tools
No ratings yet
About ... Moly-Cop Tools
4 pages
Session 2 Machine Learning Execution
No ratings yet
Session 2 Machine Learning Execution
12 pages
Shobit Sharma (2124399) ML Lab File PDF
No ratings yet
Shobit Sharma (2124399) ML Lab File PDF
19 pages
Data - Preprocessing - Tools - Ipynb - Colaboratory
No ratings yet
Data - Preprocessing - Tools - Ipynb - Colaboratory
4 pages
ML7 - Colab
No ratings yet
ML7 - Colab
3 pages
20MIS1025 - DecisionTree - Ipynb - Colaboratory
No ratings yet
20MIS1025 - DecisionTree - Ipynb - Colaboratory
4 pages
ML Manual With Outputs
No ratings yet
ML Manual With Outputs
30 pages
AIML - ECE304 - Assign-2 - Kartikeya - Kandpal - Ajitesh - S.ipynb - Colab
No ratings yet
AIML - ECE304 - Assign-2 - Kartikeya - Kandpal - Ajitesh - S.ipynb - Colab
3 pages
Data Preprocessing
No ratings yet
Data Preprocessing
9 pages
AIML - ECE304 - Assign-2 - Kartikeya - Kandpal - Ajitesh - S.ipynb - Colab
No ratings yet
AIML - ECE304 - Assign-2 - Kartikeya - Kandpal - Ajitesh - S.ipynb - Colab
4 pages
ML Lab 146
No ratings yet
ML Lab 146
50 pages
Sample Code
No ratings yet
Sample Code
8 pages
Setup: This Notebook Contains All The Sample Code and Solutions To The Exercises in Chapter 3
No ratings yet
Setup: This Notebook Contains All The Sample Code and Solutions To The Exercises in Chapter 3
30 pages
Code and Output of Cancer Detection Model
No ratings yet
Code and Output of Cancer Detection Model
13 pages
Roll NO 2020
No ratings yet
Roll NO 2020
8 pages
List of Imported Libraries
No ratings yet
List of Imported Libraries
12 pages
Ai HW
No ratings yet
Ai HW
7 pages
Stanford KNNassignment
No ratings yet
Stanford KNNassignment
78 pages
Linear Regression (Code)
No ratings yet
Linear Regression (Code)
9 pages
Desicion Tree Ipynb
No ratings yet
Desicion Tree Ipynb
6 pages
LAB-4 Report
No ratings yet
LAB-4 Report
21 pages
Heart Disease Prediction - Colab
No ratings yet
Heart Disease Prediction - Colab
18 pages
DM Practical File
No ratings yet
DM Practical File
21 pages
5b Python Implementation of Decision Tree
No ratings yet
5b Python Implementation of Decision Tree
7 pages
ML Assgnment 1
No ratings yet
ML Assgnment 1
4 pages
Experiment 2.1
No ratings yet
Experiment 2.1
3 pages
Assignment 3
No ratings yet
Assignment 3
6 pages
Assignment 1
No ratings yet
Assignment 1
2 pages
ML Algorithms
100% (1)
ML Algorithms
1 page
Question - 2-Interview Question ML
No ratings yet
Question - 2-Interview Question ML
13 pages
5) Randomforest - Ipynb - Colaboratory
No ratings yet
5) Randomforest - Ipynb - Colaboratory
12 pages
Trafficcc Flow...
No ratings yet
Trafficcc Flow...
29 pages
Is Lab Aman Agarwal PDF
No ratings yet
Is Lab Aman Agarwal PDF
8 pages
B22EE010 Report
No ratings yet
B22EE010 Report
9 pages
Personalized Cancer Diagnosis
No ratings yet
Personalized Cancer Diagnosis
100 pages
Notebook - Main Code
No ratings yet
Notebook - Main Code
4 pages
Sentiment Analysis On Tweets
No ratings yet
Sentiment Analysis On Tweets
2 pages
ML Cheatsheet
No ratings yet
ML Cheatsheet
4 pages
E4 DS203 2023 Sem2
No ratings yet
E4 DS203 2023 Sem2
2 pages
EE331 2024F Assignment1 v2
No ratings yet
EE331 2024F Assignment1 v2
5 pages
Heart: Our "Goal" Predict The Presence of Heart Disease in The Patient
100% (1)
Heart: Our "Goal" Predict The Presence of Heart Disease in The Patient
73 pages
Unit 2
No ratings yet
Unit 2
5 pages
Zainab Pate Data PPF #5 - Colab
No ratings yet
Zainab Pate Data PPF #5 - Colab
10 pages
AIML Practical 02 22105A2021
No ratings yet
AIML Practical 02 22105A2021
8 pages
LSTM - Jupyter Notebook
No ratings yet
LSTM - Jupyter Notebook
7 pages
Scikit Learn Cheat Sheet Python
No ratings yet
Scikit Learn Cheat Sheet Python
1 page
Machine Learning Algorithms (Python & R) PDF
No ratings yet
Machine Learning Algorithms (Python & R) PDF
11 pages
PA Lab2
No ratings yet
PA Lab2
11 pages
Python: Master
No ratings yet
Python: Master
37 pages
16BCB0126 VL2018195002535 Pe003
No ratings yet
16BCB0126 VL2018195002535 Pe003
40 pages
Lazarus Brookframework Ref
No ratings yet
Lazarus Brookframework Ref
170 pages
Sort Metode Payload
No ratings yet
Sort Metode Payload
7 pages
06 Export From AC 16 To Artlantis Render 4.1 and Artlantis Studio 4.1
No ratings yet
06 Export From AC 16 To Artlantis Render 4.1 and Artlantis Studio 4.1
8 pages
Business Proposal IP-Arnold Empire Pty LTD
No ratings yet
Business Proposal IP-Arnold Empire Pty LTD
14 pages
IBM Replication
No ratings yet
IBM Replication
20 pages
12 Classification
No ratings yet
12 Classification
16 pages
Aashis Kumar Resume
No ratings yet
Aashis Kumar Resume
2 pages
Singer 38413016300
No ratings yet
Singer 38413016300
87 pages
Fenton Stream Function Theory
No ratings yet
Fenton Stream Function Theory
12 pages
Case Study (Oyo Rooms) - UM19252
No ratings yet
Case Study (Oyo Rooms) - UM19252
9 pages
Revised DIT Course 2011
No ratings yet
Revised DIT Course 2011
23 pages
TBC502 Introduction To Artificial Intelligence
No ratings yet
TBC502 Introduction To Artificial Intelligence
2 pages
Arm Vs Intel
No ratings yet
Arm Vs Intel
19 pages
4.profit Maximization
No ratings yet
4.profit Maximization
14 pages
CSharp Permission To Folder
No ratings yet
CSharp Permission To Folder
9 pages
Why Move From P3 To P6?: Karl Prutzer, Product Manager
No ratings yet
Why Move From P3 To P6?: Karl Prutzer, Product Manager
40 pages
This Article Explains Dijkstra
No ratings yet
This Article Explains Dijkstra
4 pages
Documentation and ASCII Archives: Simatic S7
No ratings yet
Documentation and ASCII Archives: Simatic S7
12 pages
CH13 Data Representation A2 QP 2
No ratings yet
CH13 Data Representation A2 QP 2
19 pages
Optimi Data Gateway 6.2 User Guide
No ratings yet
Optimi Data Gateway 6.2 User Guide
36 pages
Solaris Cluster Changing Public IP Addresses or Logical Host IP in Cluster Doc ID 1003630 PDF
No ratings yet
Solaris Cluster Changing Public IP Addresses or Logical Host IP in Cluster Doc ID 1003630 PDF
3 pages
Heron's Formula
No ratings yet
Heron's Formula
2 pages
ZTE EReader (V2.22) User Guide
No ratings yet
ZTE EReader (V2.22) User Guide
46 pages
Lab 01 - OS
No ratings yet
Lab 01 - OS
3 pages
Oracle Database 11g Database Architecture and ASM
No ratings yet
Oracle Database 11g Database Architecture and ASM
44 pages
Self Refferential Structure
No ratings yet
Self Refferential Structure
30 pages
BSC It Dbms Notes
73% (11)
BSC It Dbms Notes
187 pages