0% found this document useful (0 votes)

14 views9 pages

Toc ch1

The document contains code for performing various statistical analyses in R including principal component analysis, k-means clustering, hierarchical clustering, hypothesis testing, time series analysis, linear regression, ANOVA, and data visualization techniques like histograms, dot plots, and bar plots using the built-in mtcars dataset. Various packages are also loaded and functions used to conduct the analyses and visualize the results.

Uploaded by

Sahil Shete

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

14 views9 pages

Toc ch1

Uploaded by

Sahil Shete

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 9

1.

Pca

# ---- Principal component analysis of the iris measurements ----
# Load the built-in iris data and take a first look at it.
data("iris")
head(iris)
summary(iris)

# Find the principal components of every column except the fifth one.
# `scale. = TRUE` standardises each variable before the decomposition; the
# argument name is spelled out in full (the original `scale = T` only worked
# through partial argument matching and the reassignable shorthand `T`).
mypr <- prcomp(iris[, -5], scale. = TRUE)

# To understand the use of scaling: the same scatter plot on the raw values
# and on the standardised values.
plot(iris$Sepal.Length, iris$Sepal.Width)
plot(scale(iris$Sepal.Length), scale(iris$Sepal.Width))

# Inspect the fit: printed object, summary, a line plot of the component
# variances and a biplot.
mypr
summary(mypr)
plot(mypr, type = "l")
biplot(mypr, scale = 0)

# Extract the PC scores (stored in mypr$x) and append the first two of them
# to the original data as columns 6 and 7.
str(mypr)
mypr$x
iris2 <- cbind(iris, mypr$x[, 1:2])
head(iris2)

# Correlation between the original variables and the two appended scores.
cor(iris[, -5], iris2[, 6:7])

# ---- Principal component regression with the pls package ----
# Install pls only when it is missing, so the script does not hit the network
# and reinstall the package on every run.
if (!requireNamespace("pls", quietly = TRUE)) {
  install.packages("pls")
}
library(pls)

names(iris)

# Regress Sepal.Length on the other four columns, keeping three components.
# TRUE is spelled out because the shorthand T can be reassigned.
pcmodel <- pcr(
  Sepal.Length ~ Species + Sepal.Width + Petal.Length + Petal.Width,
  ncomp = 3, data = iris, scale = TRUE
)

# Store the predictions made with ncomp = 2 as a new column of iris.
# NOTE(review): predict() on a pcr fit is documented to return a
# three-dimensional array; consider wrapping it in drop() -- confirm.
iris$pred <- predict(pcmodel, iris, ncomp = 2)
head(iris)
2. "k-means clustering "

# ---- k-means clustering of the iris measurements ----
data("iris")
names(iris)

# Work on the data without the Species column.
new_data <- subset(iris, select = -Species)
new_data

# kmeans() starts from randomly chosen centres. Fixing the seed and trying
# several starts (nstart) makes the clustering and the elbow curve below
# reproducible and far less likely to stop in a poor local optimum.
set.seed(123)
cl <- kmeans(new_data, centers = 3, nstart = 25)

# Alias kept so that any later code referring to `data` keeps working.
data <- new_data

# Elbow method: total within-cluster sum of squares for k = 1, ..., 15.
# vapply() guarantees a numeric vector of length 15 (sapply() does not).
wss <- vapply(
  1:15,
  function(k) kmeans(data, centers = k, nstart = 25)$tot.withinss,
  numeric(1)
)
wss

# `frame.plot` is spelled out; the original `frame = FALSE` relied on partial
# argument matching.
plot(1:15, wss,
     type = "b", pch = 19, frame.plot = FALSE,
     xlab = "Number of clusters K",
     ylab = "Total within-clusters sum of squares")

# clusplot() comes from the cluster package. Install it only when it is
# missing instead of reinstalling it on every run of the script.
if (!requireNamespace("cluster", quietly = TRUE)) {
  install.packages("cluster")
}
library(cluster)

# Draw the k-means partition stored in `cl` for the rows of `new_data`.
clusplot(new_data, cl$cluster,
         color = TRUE, shade = TRUE,
         labels = 2, lines = 0)

# Cluster assignment of every row and the fitted cluster centres.
cl$cluster
cl$centers

3. "agglomerative clustering "

# Hierarchical clustering of columns 3 and 4 of iris using hclust()'s default
# method, followed by the dendrogram.
clusters <- hclust(d = dist(iris[, 3:4]))
plot(clusters)

# Cut the tree into three groups and cross-tabulate them against the species.
clusterCut <- cutree(clusters, k = 3)
table(clusterCut, iris$Species)

# ggplot(), aes(), geom_point() and scale_color_manual() come from ggplot2,
# which the script never loaded; attach it before plotting.
library(ggplot2)

# Large translucent points are coloured by species, small solid points by the
# cluster in `clusterCut`. Inside aes() the column is referenced by its bare
# name (not iris$Species) so it is looked up in the data passed to ggplot().
ggplot(iris, aes(Petal.Length, Petal.Width, color = Species)) +
  geom_point(alpha = 0.4, size = 3.5) +
  geom_point(col = clusterCut) +
  scale_color_manual(values = c("black", "red", "green"))

# Repeat the hierarchical clustering of columns 3 and 4 with average linkage.
clusters <- hclust(d = dist(iris[, 3:4]), method = "average")

# Three-group cut of the new tree, compared with the species labels.
clusterCut1 <- cutree(clusters, k = 3)
table(clusterCut1, iris$Species)

# Dendrogram of the average-linkage tree.
plot(clusters)

# ggplot(), aes(), geom_point() and scale_color_manual() come from ggplot2,
# which the script never loaded; attach it before plotting.
library(ggplot2)

# Large translucent points are coloured by species, small solid points by the
# cluster in `clusterCut1`. Inside aes() the column is referenced by its bare
# name (not iris$Species) so it is looked up in the data passed to ggplot().
ggplot(iris, aes(Petal.Length, Petal.Width, color = Species)) +
  geom_point(alpha = 0.4, size = 3.5) +
  geom_point(col = clusterCut1) +
  scale_color_manual(values = c("black", "red", "green"))

4. //hypothesis//

# ---- One-sample t-test on the integers 1 to 20 ----
dataf <- seq(1, 20, by = 1)
dataf
mean(dataf)
sd(dataf)

# Two-sided test of the null hypothesis that the mean equals 10.
# The confidence level is set through `conf.level`; the original
# `conf.int = 0.95` is not an argument of t.test() and was silently ignored.
a <- t.test(dataf, alternative = "two.sided", mu = 10, conf.level = 0.95)

# Display the test result (the original stored it without showing it).
a

5. //time series//

# ---- Time series exploration of the AirPassengers data ----
data("AirPassengers")

# Basic facts about the series: class, first and last time point, number of
# observations per unit of time, and a numeric summary.
class(AirPassengers)
start(AirPassengers)
end(AirPassengers)
frequency(AirPassengers)
summary(AirPassengers)

# Plot the series and overlay the straight line fitted against time.
plot(AirPassengers)
abline(lm(AirPassengers ~ time(AirPassengers)))

# Position of each observation within its cycle.
cycle(AirPassengers)

# Series aggregated with the mean, then box plots grouped by cycle position.
plot(aggregate(AirPassengers, FUN = mean))
boxplot(AirPassengers ~ cycle(AirPassengers))
6. Linear regression

# ---- Simple linear regression of weight on height (seven observations) ----
height <- c(102, 117, 105, 141, 135, 115, 138)
weight <- c(61, 46, 62, 54, 60, 69, 51)

student <- lm(weight ~ height)
student

# Predicted weight at height = 119 together with its confidence interval.
# The closing quote of "confidence" was missing in the original, which made
# the whole script fail to parse.
predict(student, data.frame(height = 119), interval = "confidence")

# Diagnostic plots of the fitted model.
plot(student)

# F-test for equality of two variances.
# The CSV file is picked interactively; TRUE is spelled out because the
# shorthand T is an ordinary variable that can be reassigned.
# NOTE(review): assumes the chosen file has columns time_g1 and time_g2 --
# confirm against the data file.
ftest <- read.csv(file.choose(), sep = ",", header = TRUE)

var.test(ftest$time_g1, ftest$time_g2, alternative = "two.sided")

"one way anova"

# One-way analysis of variance of satindex by dept.
# The CSV file is picked interactively; TRUE is spelled out because the
# shorthand T is an ordinary variable that can be reassigned.
data1 <- read.csv(file.choose(), sep = ",", header = TRUE)

# Quick look at the imported data.
names(data1)
summary(data1)
head(data1)

# NOTE(review): assumes dept is read as a character/factor column; a numeric
# code would be fitted as a continuous predictor -- confirm against the file.
anv <- aov(formula = satindex ~ dept, data = data1)
summary(anv)

8. "two way anova"

# Two-way analysis of variance of satindex by dept and exp with interaction.
# The CSV file is picked interactively; TRUE is spelled out because the
# shorthand T is an ordinary variable that can be reassigned.
data2 <- read.csv(file.choose(), sep = ",", header = TRUE)

# Quick look at the imported data.
names(data2)
summary(data2)

# `dept * exp` already expands to dept + exp + dept:exp, so the main effects
# do not need to be listed a second time.
# NOTE(review): assumes dept and exp are read as character/factor columns --
# confirm against the file.
anv1 <- aov(formula = satindex ~ dept * exp, data = data2)
summary(anv1)
Practical No :
Aim: Implement regression in R

Code:

# Scatter plot of mpg against wt from mtcars with the fitted regression line.
# with() and the `data` argument replace attach(mtcars), which would leave the
# data frame on the search path and can mask other objects. Calling
# plot(wt, mpg) inside with() keeps the axis labels "wt" and "mpg".
with(mtcars, plot(wt, mpg))
abline(lm(mpg ~ wt, data = mtcars))
title("Regression of MPG on weight")

Output:

Practical No:
Aim:

Code

Histogram

# Histogram of the mpg column of mtcars with hist()'s default settings.
hist(mtcars$mpg)

# Same column again, passing breaks = 20 and filling the bars in green.
hist(mtcars$mpg, breaks = 20, col = "green")

Output:

DotChart

Code:
# Dot chart of mpg with one line per row of mtcars, labelled by row name and
# drawn with slightly reduced text size.
dotchart(
  mtcars$mpg,
  labels = rownames(mtcars),
  cex = 0.7,
  xlab = "Miles Per Gallon",
  main = "Gas MIlage for Car Models"
)

Output:

Barplot

Code

# Frequency of each value of the gear column, shown as a vertical bar plot.
counts <- table(mtcars[["gear"]])
barplot(
  counts,
  xlab = "Number of Gears",
  main = "Car Distribution"
)

output:
Code:

# Same gear frequencies drawn as horizontal bars with descriptive bar labels.
counts <- table(mtcars[["gear"]])
barplot(
  counts,
  horiz = TRUE,
  names.arg = c("3 Gears", "4 Gears", "5 Gears"),
  main = "Car Distribution"
)

output:

Code:

# Two-way table of vs (rows) by gear (columns), drawn as a stacked bar plot
# with one colour per row of the table.
counts <- table(mtcars$vs, mtcars$gear)

# `legend.text` is spelled out in full; the original `legend =` only worked
# through partial argument matching.
barplot(counts,
        main = "Car distribution by Gears and VS",
        xlab = "Number of gears",
        col = c("darkblue", "red"),
        legend.text = rownames(counts))

output:

ASK (G) Kelompok 4 - Pertemuan 9
No ratings yet
ASK (G) Kelompok 4 - Pertemuan 9
13 pages
DATAMINING
No ratings yet
DATAMINING
24 pages
Bi 5to 8
No ratings yet
Bi 5to 8
6 pages
R Lab Program
No ratings yet
R Lab Program
20 pages
Data Science
No ratings yet
Data Science
15 pages
Da 06-10
No ratings yet
Da 06-10
14 pages
WEEK
No ratings yet
WEEK
17 pages
Ds
No ratings yet
Ds
2 pages
Ds
No ratings yet
Ds
2 pages
Datamining Lab Record
No ratings yet
Datamining Lab Record
36 pages
File 2
No ratings yet
File 2
17 pages
Final Data Lab
No ratings yet
Final Data Lab
21 pages
Data Scinece Practical File
No ratings yet
Data Scinece Practical File
23 pages
File 2
No ratings yet
File 2
17 pages
Da Thoery
No ratings yet
Da Thoery
24 pages
Aman DA 111
No ratings yet
Aman DA 111
14 pages
BDA Lab Manual (12 Weeks)
No ratings yet
BDA Lab Manual (12 Weeks)
22 pages
Datamininganddataware
No ratings yet
Datamininganddataware
25 pages
HW11數學規劃
No ratings yet
HW11數學規劃
14 pages
Final Data Lab
No ratings yet
Final Data Lab
20 pages
Shahun Term Workr1
No ratings yet
Shahun Term Workr1
34 pages
R - Language Lab Manual - PG 2024
No ratings yet
R - Language Lab Manual - PG 2024
29 pages
DM Lab
No ratings yet
DM Lab
18 pages
Ds Paper
No ratings yet
Ds Paper
35 pages
Department Of: Computer Science & Engineering
No ratings yet
Department Of: Computer Science & Engineering
4 pages
Kmeans.R: Finding The Elbow' in Wss Curve
No ratings yet
Kmeans.R: Finding The Elbow' in Wss Curve
4 pages
DS File Et C1 23
No ratings yet
DS File Et C1 23
15 pages
Week 10 Abhishek Srivastava VFinal
No ratings yet
Week 10 Abhishek Srivastava VFinal
14 pages
Data Cleaning
No ratings yet
Data Cleaning
4 pages
Clustering R Codes
No ratings yet
Clustering R Codes
2 pages
Record
No ratings yet
Record
23 pages
R Practicals (2007 Version)
No ratings yet
R Practicals (2007 Version)
15 pages
Final ML File
No ratings yet
Final ML File
34 pages
BAN5
No ratings yet
BAN5
2 pages
MicroArray Analysis - 201
No ratings yet
MicroArray Analysis - 201
13 pages
R Lab Manual (1) - Merged
No ratings yet
R Lab Manual (1) - Merged
25 pages
Datamining
No ratings yet
Datamining
20 pages
K-Means Cluter Analysis For IRIS Data Frame in R
No ratings yet
K-Means Cluter Analysis For IRIS Data Frame in R
3 pages
R Record-1
No ratings yet
R Record-1
53 pages
ISYE6501 Homework 2
No ratings yet
ISYE6501 Homework 2
11 pages
Datamining 2
No ratings yet
Datamining 2
54 pages
FDS DW Journal
No ratings yet
FDS DW Journal
28 pages
R Practicals
No ratings yet
R Practicals
32 pages
R Lab Manual
No ratings yet
R Lab Manual
22 pages
Model Lab
No ratings yet
Model Lab
6 pages
ISYE 6501 Georgia Tech hmwk4.2
No ratings yet
ISYE 6501 Georgia Tech hmwk4.2
4 pages
Kmean PGM
No ratings yet
Kmean PGM
3 pages
R Course
No ratings yet
R Course
7 pages
Rlab
No ratings yet
Rlab
7 pages
Data Science Project
No ratings yet
Data Science Project
31 pages
Assigmnent 3 (Data Mining)
No ratings yet
Assigmnent 3 (Data Mining)
18 pages
R Code For Discriminant and Cluster Analysis
No ratings yet
R Code For Discriminant and Cluster Analysis
23 pages
CASOS
No ratings yet
CASOS
12 pages
R Codes
No ratings yet
R Codes
5 pages
Anuj Khandelwal 3029 BCP A Business Analytics Continuous Assessment 2
No ratings yet
Anuj Khandelwal 3029 BCP A Business Analytics Continuous Assessment 2
20 pages
Solution HW2
No ratings yet
Solution HW2
6 pages
Experiment 6
No ratings yet
Experiment 6
7 pages
Codes
No ratings yet
Codes
8 pages
TensorFlow深度学习项目实战: Chinese Edition
From Everand
TensorFlow深度学习项目实战: Chinese Edition
Posts & Telecom Press
No ratings yet
Lisp Programming Language
From Everand
Lisp Programming Language
Faiz ul haque Zeya
No ratings yet
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
From Everand
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
Manish Soni
No ratings yet
Diagonalization Notes
No ratings yet
Diagonalization Notes
20 pages
Principal Component Analysis - A Tutorial
No ratings yet
Principal Component Analysis - A Tutorial
37 pages
Practica - Dirigida - 2 - Algebra Lineal PDF
No ratings yet
Practica - Dirigida - 2 - Algebra Lineal PDF
8 pages
Generalized Eigenvalue
No ratings yet
Generalized Eigenvalue
13 pages
Surat Cerai PDF
No ratings yet
Surat Cerai PDF
23 pages
8a Solving Matrix Quadratic Equations
No ratings yet
8a Solving Matrix Quadratic Equations
3 pages
AL S15 Lab
No ratings yet
AL S15 Lab
6 pages
AdvancedSensorySystems 3b SVD
No ratings yet
AdvancedSensorySystems 3b SVD
13 pages
Matrix Decomposition Chap1
No ratings yet
Matrix Decomposition Chap1
9 pages
Solution Manual Aljabar Linear
No ratings yet
Solution Manual Aljabar Linear
8 pages
As Quiz 3 PCA Solution PDF
100% (1)
As Quiz 3 PCA Solution PDF
1 page
Linear Algebra: Lecture Notes
No ratings yet
Linear Algebra: Lecture Notes
47 pages
Manual Jan 5000
No ratings yet
Manual Jan 5000
65 pages
Assignment On Matrix and Linear Algebra: Eigen Value: Sunjida Haque
No ratings yet
Assignment On Matrix and Linear Algebra: Eigen Value: Sunjida Haque
25 pages
LU Decomposition
No ratings yet
LU Decomposition
3 pages
Mat PROJEKT MAT 1 PDF
No ratings yet
Mat PROJEKT MAT 1 PDF
10 pages
04 Jun 2021 MATHEMATICS-II
No ratings yet
04 Jun 2021 MATHEMATICS-II
12 pages
Test Exam 2
No ratings yet
Test Exam 2
17 pages
CASA Statement Feb2025 03032025211618 PDF
No ratings yet
CASA Statement Feb2025 03032025211618 PDF
16 pages
PCA PDF 1646672241
No ratings yet
PCA PDF 1646672241
11 pages
KREYSZIG 10E (update版) -Errata CH1~CH18 小本 PDF
No ratings yet
KREYSZIG 10E (update版) -Errata CH1~CH18 小本 PDF
18 pages
F1g121089-Yulinar (Makalah Aljabar Linear)
No ratings yet
F1g121089-Yulinar (Makalah Aljabar Linear)
17 pages
CIVL Pablo Hurtado Assignment
No ratings yet
CIVL Pablo Hurtado Assignment
4 pages
Practical 5: LU Decomposition Method
No ratings yet
Practical 5: LU Decomposition Method
4 pages
Homework Eigen-With Answers
No ratings yet
Homework Eigen-With Answers
7 pages
Final
No ratings yet
Final
3 pages
PCA V V Imp Principal Component Analysis 4 Dummies ..
No ratings yet
PCA V V Imp Principal Component Analysis 4 Dummies ..
15 pages
Math-803-Lecture 19-Matrix - Approx - PCA
No ratings yet
Math-803-Lecture 19-Matrix - Approx - PCA
17 pages
Exercises On LU Factorization
No ratings yet
Exercises On LU Factorization
1 page

Toc ch1

Uploaded by

Toc ch1

Uploaded by

1.

"to find principal component"

"to understand use of scale"

data <- new_data

wss <- sapply(1:15,

type="b", pch = 19, frame = FALSE,

xlab="Number of clusters K",

ylab="Total within-clusters sum of squares")

clusplot(new_data, cl$cluster, color=TRUE, shade=TRUE,

3. "agglomerative clustering "

clusters <- hclust(dist(iris[, 3:4]))

clusterCut <- cutree(clusters, 3)

ggplot(iris, aes(Petal.Length, Petal.Width, color = iris$Species)) +

geom_point(alpha = 0.4, size = 3.5) + geom_point(col = clusterCut) +

scale_color_manual(values = c('black', 'red', 'green'))

clusterCut1 <- cutree(clusters, 3)

ggplot(iris, aes(Petal.Length, Petal.Width, color = iris$Species)) +

geom_point(alpha = 0.4, size = 3.5) + geom_point(col = clusterCut1) +

scale_color_manual(values = c('black', 'red', 'green'))

"one way anova"

8. "two way anova"

anv1<-aov(formula = satindex~ dept+exp+dept*exp,data = data2)

title("Regression of MPG on weight")

hist(mtcars$mpg, breaks = 20, col = "green")

main="Gas MIlage for Car Models",

xlab = "Miles Per Gallon")

barplot(counts, main="Car Distribution",xlab = "Number of Gears")

barplot(counts, main="Car Distribution", horiz = TRUE,

names.arg = c("3 Gears","4 Gears", "5 Gears"))

barplot(counts,main = "Car distribution by Gears and VS",

xlab = "Number of gears", col =c("darkblue","red"),

You might also like