DM Lab

The document certifies the completion of practical work in a Computer Laboratory for the academic year 2023-2024. It includes various programming tasks such as implementing the Apriori algorithm, K-means and hierarchical clustering, decision tree classification, linear regression, and data visualization using R. Each task is accompanied by sample code and outputs demonstrating the respective techniques.


This is to certify that this is a bonafide record of the work done in the
Computer Laboratory during the academic year 2023 – 2024.

Name :

Class :

Register No. :

Roll No. :

Lab :

For the practical examination held on ________________

Staff In-Charge

Head of the Department

Examiners:

1.

2.


Name :

Register No.:

Roll No. :
S.No    Date    Title    Page No.    Staff Sign

Staff Signature:
1) Apriori Algorithm

# Load the required libraries
library(arules)
library(arulesViz)
library(RColorBrewer)

# Import the built-in Groceries transaction dataset
data("Groceries")

# Mine association rules with the apriori() function
rules <- apriori(Groceries,
                 parameter = list(supp = 0.01, conf = 0.2))

# Inspect the first ten rules
inspect(rules[1:10])

# Plot the relative frequency of the 20 most common items
arules::itemFrequencyPlot(Groceries, topN = 20,
                          col = brewer.pal(8, 'Pastel2'),
                          main = 'Relative Item Frequency Plot',
                          type = "relative",
                          ylab = "Item Frequency (Relative)")


Output:
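
Beyond the first ten rules, the rule set can be ranked by an interestingness measure such as lift. A minimal extension sketch, assuming the rules object created above:

# Sort the mined rules by lift, i.e. how much more often the items
# co-occur than expected if they were independent
rules_by_lift <- sort(rules, by = "lift", decreasing = TRUE)

# Inspect the five rules with the highest lift
inspect(head(rules_by_lift, 5))
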
2) K-Means Clustering

# Generate a sample dataset
set.seed(123)
data <- data.frame(
  X1 = rnorm(100, mean = 10, sd = 2),
  X2 = rnorm(100, mean = 20, sd = 3)
)

# Implement K-means clustering
k <- 3  # Number of clusters
kmeans_result <- kmeans(data, centers = k, nstart = 20)

# Print the cluster centers
print(kmeans_result$centers)

# Print the cluster assignments for each data point
print(kmeans_result$cluster)

# Visualize the dataset with cluster assignments and mark the centers
plot(data, col = kmeans_result$cluster, main = "K-means Clustering")
points(kmeans_result$centers, col = 1:k, pch = 8, cex = 2)


Output:
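
The choice of k = 3 is fixed by hand above; a common sanity check is the elbow method, which plots the total within-cluster sum of squares against k and looks for the bend in the curve. A minimal sketch, reusing the same data frame:

# Elbow method: compute the total within-cluster sum of squares
# for k = 1 to 10
wss <- sapply(1:10, function(k) {
  kmeans(data, centers = k, nstart = 20)$tot.withinss
})
plot(1:10, wss, type = "b", pch = 19,
     xlab = "Number of clusters k",
     ylab = "Total within-cluster sum of squares",
     main = "Elbow Method")
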
3) Hierarchical Clustering

# Generate a sample dataset
set.seed(123)
data <- matrix(rnorm(100), ncol = 2)

# Implement hierarchical clustering on the Euclidean distance matrix
hierarchical_result <- hclust(dist(data))

# Cut the dendrogram to get clusters
num_clusters <- 3
clusters <- cutree(hierarchical_result, k = num_clusters)

# Visualize the hierarchical clustering dendrogram
plot(hierarchical_result, main = "Hierarchical Clustering Dendrogram")

# Visualize the clustered data
plot(data, col = clusters, pch = 19, main = "Hierarchical Clustering Results")


Output:
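
hclust() uses complete linkage by default; other linkage criteria can produce quite different trees. A brief sketch comparing two alternatives on the same data matrix:

# Compare linkage criteria: average linkage and Ward's
# minimum-variance method on the same distance matrix
d <- dist(data)
average_result <- hclust(d, method = "average")
ward_result <- hclust(d, method = "ward.D2")
plot(ward_result, main = "Hierarchical Clustering Dendrogram (Ward's Method)")
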
4) Classification Algorithm (Decision Tree)

# Load the necessary libraries
library(rpart)
library(rpart.plot)

# Load the iris dataset
data(iris)

# Split the dataset into training (70%) and testing (30%) sets
set.seed(123)
sample_indices <- sample(1:nrow(iris), 0.7 * nrow(iris))
train_data <- iris[sample_indices, ]
test_data <- iris[-sample_indices, ]

# Build a decision tree classifier
classifier <- rpart(Species ~ ., data = train_data, method = "class")

# Visualize the decision tree
rpart.plot(classifier, main = "Decision Tree Classifier")

# Make predictions on the test set
predictions <- predict(classifier, test_data, type = "class")

# Evaluate the classifier with a confusion matrix
confusion_matrix <- table(predictions, test_data$Species)
print("Confusion Matrix:")
print(confusion_matrix)

# Compute accuracy as the proportion of correct predictions
accuracy <- sum(diag(confusion_matrix)) / sum(confusion_matrix)
print(paste("Accuracy:", round(accuracy, 2)))


Output:
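
Overall accuracy can hide class-specific errors; per-class precision and recall can be read off the same confusion matrix. A minimal sketch, assuming the confusion_matrix object above (rows are predictions, columns are the true species):

# Per-class precision: of the flowers predicted as a species,
# the fraction that truly belong to it
precision <- diag(confusion_matrix) / rowSums(confusion_matrix)

# Per-class recall: of the flowers truly of a species,
# the fraction the tree recovered
recall <- diag(confusion_matrix) / colSums(confusion_matrix)

print(round(precision, 2))
print(round(recall, 2))
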
5) Decision Tree

# Load the libraries for fitting and plotting decision trees
library(rpart)
library(rpart.plot)

# Load the iris dataset
data(iris)

# Build the decision tree model on the full dataset
tree <- rpart(Species ~ ., data = iris, method = "class")

# Plot the tree; extra = 104 shows per-class probabilities and the
# percentage of observations in each node (extra = 106 is intended
# for binary responses and warns on the three-class iris data)
rpart.plot(tree, extra = 104)


Output:
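
The fitted tree can also classify new observations with predict(). A small sketch with a hypothetical flower measurement (the values below are invented for illustration, not taken from the iris data):

# Classify a single hypothetical new flower (illustrative values)
new_flower <- data.frame(Sepal.Length = 5.9, Sepal.Width = 3.0,
                         Petal.Length = 4.2, Petal.Width = 1.3)
predict(tree, new_flower, type = "class")
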
6) Linear Regression

# Generate a sample dataset with a known linear relationship
set.seed(123)
x <- rnorm(100, mean = 10, sd = 2)
y <- 3 * x + rnorm(100, mean = 0, sd = 3)

# Create a data frame
data <- data.frame(x = x, y = y)

# Fit the linear regression model
linear_model <- lm(y ~ x, data = data)

# Print the summary of the linear regression model
print(summary(linear_model))

# Visualize the data and the fitted regression line
plot(x, y, main = "Linear Regression", xlab = "X", ylab = "Y")
abline(linear_model, col = "red")


Output:
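
Once fitted, the model can predict y at new x values, and predict() can attach prediction intervals to quantify the uncertainty. A minimal sketch, assuming the linear_model object above:

# Predict y at a few new x values, with 95% prediction intervals
# that account for both estimation error and residual noise
new_x <- data.frame(x = c(8, 10, 12))
predict(linear_model, newdata = new_x, interval = "prediction")
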
7) Data Visualization

# Install (if needed) and load the ggplot2 library
if (!requireNamespace("ggplot2", quietly = TRUE)) {
  install.packages("ggplot2")
}
library(ggplot2)

# Load the mtcars dataset
data(mtcars)

# Create a scatter plot of mpg (miles per gallon) vs. hp (horsepower)
ggplot(mtcars, aes(x = hp, y = mpg)) +
  geom_point() +
  labs(title = "Scatter Plot of MPG vs. Horsepower",
       x = "Horsepower",
       y = "Miles per Gallon")
Output:
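
Because ggplot2 builds plots from layers, the scatter plot above can be extended with a fitted trend line by adding one more layer. A short sketch using geom_smooth():

# The same scatter plot with a linear trend line and its
# confidence band added as an extra layer
ggplot(mtcars, aes(x = hp, y = mpg)) +
  geom_point() +
  geom_smooth(method = "lm", se = TRUE) +
  labs(title = "MPG vs. Horsepower with Linear Trend",
       x = "Horsepower",
       y = "Miles per Gallon")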
