R Practicals (2007 Version)
R Practicals (2007 Version)
Reg.No :
Name :
Semester :
Year :
Reg.No :
Name :
Sub.Code :
This is to certify that this is the bona fide record of the practical work done in
DATA MINING USING R at St. Mary’s College (Autonomous), during the year 2023-2024,
submitted for the M.Sc. Computer Science Practical Examination held on __________
at St. Mary’s College (Autonomous), Thoothukudi.
Date: Staff-in-charge
4 07.02.2024 CLASSIFICATION
1. Apriori Algorithm
# Practical 1: mine association rules from the Groceries transactions with
# the Apriori algorithm and plot the most frequent items.
library(arules)
library(arulesViz)
library(RColorBrewer)

# import dataset
data("Groceries")

# NOTE(review): the statement that created `rules` is missing from the
# original listing, so `inspect(rules[1:10])` could not run. The support and
# confidence thresholds below are assumed -- confirm against the experiment.
rules <- apriori(Groceries, parameter = list(supp = 0.01, conf = 0.2))

# head() caps the selection at the number of rules actually mined, so this
# does not fail when fewer than 10 rules are found.
inspect(head(rules, n = 10))

# NOTE(review): only the `type = "relative",` argument of this call survived
# in the original listing; the function and the remaining arguments are
# assumed -- confirm.
itemFrequencyPlot(
  Groceries,
  topN = 20,
  type = "relative",
  col = brewer.pal(8, "Pastel2"),
  main = "Relative Item Frequency Plot",
  ylab = "Item Frequency (Relative)"
)
2. K- Means Clustering
# Practical 2: K-means clustering (K = 2) on a small two-dimensional sample.
# Fix the RNG seed so the sample and the cluster assignment are reproducible.
set.seed(123)

# NOTE(review): the statement that created `data` is missing from the
# original listing. Two Gaussian groups of 50 points are assumed here --
# replace with the intended data set if it differs.
data <- data.frame(
  x = c(rnorm(50, mean = 0), rnorm(50, mean = 5)),
  y = c(rnorm(50, mean = 0), rnorm(50, mean = 5))
)

# Raw points before clustering.
plot(data$x, data$y, col = "blue", pch = 16, main = "Sample Data for K-Means Clustering")

# NOTE(review): the kmeans() call is also missing from the original listing;
# K = 2 is taken from the plot title below. Only the x/y columns are passed
# so that re-running after `cluster` has been added does not feed the labels
# back into the clustering.
kmeans_result <- kmeans(data[, c("x", "y")], centers = 2)

# Attach each point's cluster label and colour the points by it.
data$cluster <- kmeans_result$cluster
plot(data$x, data$y, col = data$cluster, pch = 16, main = "K-Means Clustering (K=2)")

cat("Cluster Centers:\n")
print(kmeans_result$centers)
OUTPUT:
3. Hierarchical Clustering
# Practical 3: agglomerative hierarchical clustering of the mtcars data set.
library(dplyr)

head(mtcars)

# NOTE(review): the assignments to `distance_mat`, `Hierar_cl` and `fit` are
# missing from the original listing (only the bare names survived). The
# distance metric, linkage method and number of clusters below are assumed --
# confirm against the intended experiment.

# Pairwise distances between the rows (cars).
distance_mat <- dist(mtcars, method = "euclidean")
distance_mat

# Build the cluster tree from the distance matrix.
Hierar_cl <- hclust(distance_mat, method = "average")
Hierar_cl

# Plotting dendrogram
plot(Hierar_cl)

# Cut the tree into groups and show the membership and the group sizes.
fit <- cutree(Hierar_cl, k = 3)
fit
table(fit)
OUTPUT:
4. Classification Algorithm
# Practical 4: fit and plot a conditional inference tree classifier.
library(party)

# Create the input data frame.
# NOTE(review): the statements that built the input data and `output.tree`
# are missing from the original listing, so `plot(output.tree)` could not
# run. The data set, row range and formula below are assumed -- confirm.
input.dat <- readingSkills[1:105, ]

# Fit the tree that the plot below displays.
output.tree <- ctree(nativeSpeaker ~ age + shoeSize + score, data = input.dat)

plot(output.tree)
OUTPUT:
5. Decision Tree
# Practical 5: decision tree on the readingSkills data set.
# NOTE(review): the original loaded `dataset`; the package shipped with R is
# `datasets`, so this is assumed to be a typo -- confirm.
library(datasets)
library(caTools)
library(party)
library(dplyr)
library(magrittr)

data("readingSkills")
head(readingSkills)

# NOTE(review): the statements that created `model` are missing from the
# original listing, so `plot(model)` could not run. An 80/20 split on the
# class label followed by a tree on all predictors is assumed -- confirm.
split_mask <- sample.split(readingSkills$nativeSpeaker, SplitRatio = 0.8)
train_data <- subset(readingSkills, split_mask)

model <- ctree(nativeSpeaker ~ ., data = train_data)

plot(model)
OUTPUT:
6. Linear Regression
# Practical 6: simple linear regression of y on x.
# Ten paired observations: x is the predictor, y the response.
x <- c(151, 174, 138, 186, 128, 136, 179, 163, 152, 131)
y <- c(63, 81, 56, 91, 47, 57, 76, 72, 62, 48)

# Fit the least-squares line y = a + b * x.
relation <- lm(formula = y ~ x)

# Show coefficients, residual summary and goodness-of-fit statistics.
relation_summary <- summary(relation)
print(relation_summary)
OUTPUT:
7. Data Visualization
# Practical 7: basic plots of the built-in airquality data set.
# Load the data set before the first plot that uses it.
data(airquality)

# Horizontal bar plot of the ozone readings.
barplot(
  airquality$Ozone,
  main = "Ozone Concentration in air",
  xlab = "ozone levels",
  horiz = TRUE
)

# Vertical bar plot of the same readings, filled in blue.
barplot(
  airquality$Ozone,
  main = "Ozone Concentration in air",
  xlab = "ozone levels",
  col = "blue",
  horiz = FALSE
)

# Histogram of the temperature readings. The title is split over two lines
# with "\n"; the original "\ " is not a valid escape and stops R parsing.
hist(
  airquality$Temp,
  main = "La Guardia Airport's\nMaximum Temperature(Daily)",
  xlab = "Temperature(Fahrenheit)",
  xlim = c(50, 125),
  col = "yellow",
  freq = TRUE
)

# Box plots of the first four columns. Column indices start at 1; the 0 in
# the original 0:4 was silently ignored.
boxplot(airquality[, 1:4], main = "Box Plots for Air Quality Parameters")

# Horizontal, notched box plot of wind speed.
boxplot(
  airquality$Wind,
  main = "Average wind speed\nat La Guardia Airport",
  xlab = "Miles per hour",
  ylab = "Wind",
  col = "orange",
  border = "brown",
  horizontal = TRUE,
  notch = TRUE
)

# Scatter plot of ozone against month of observation.
plot(
  airquality$Ozone,
  airquality$Month,
  main = "Scatterplot Example",
  xlab = "Ozone Concentration in parts per billion",
  ylab = " Month of observation ",
  pch = 19
)
OUTPUT: