saurabh
saurabh
OBJECTIVE- To get input from the user and perform numerical operations
(MAX, MIN, AVG, SUM, SQRT, ROUND) using R.
Program-
#Create a Vector
> data=c(23,4,56,21,34,56,73)
> #Get the maximum value
> print(max(data))
[1] 73
> #Get the minimum value
> print(min(data))
[1] 4
> #Get the SUM-
> sum(data)
[1] 267
> #Get the AVG-
> print(mean(data))
[1] 38.14286
> #Get the SQRT-
> a=5
> print(sqrt(a))
[1] 2.236068
> a=5.2
> #Get the ROUND-
> print(round(a))
[1] 5
Program-
# .CSV
# Read the quarterly business financial CSV into a data frame and print it.
# The path has to be one unbroken string: a line break inside the quotes
# becomes part of the file name and the file is then not found, so the long
# path is assembled from two pieces with paste0() instead.
read.data <- read.csv(
  paste0(
    "C:/Users/saurabh/OneDrive/Desktop/College Work/5th-Semester/",
    "I.D.A.V Lab/business-financial-data-june-2023-quarter-csv.csv"
  )
)
print(read.data)
#.XLS
> install.packages("readxl")
> library(readxl)
# .TXT
# Read the tab-separated text file, using its first line as column names.
txt_data <- read.table(
  "C:/Users/saurabh/OneDrive/Desktop/R_Language.txt",
  header = TRUE,
  sep = "\t"
)
# Print the table that was just read; the visible script never defines
# excel_data, so printing it here would fail with "object not found".
print(txt_data)
Sample Output-
CSV FILE-
TXT FILE-
OBJECTIVE- To get the input matrix from the user and perform matrix addition,
subtraction, multiplication, inverse, transpose and division operations using
the vector concept in R.
Program-
#MATRIX CREATION
> {r = readline("Enter the number of rows:")}
> r = as.integer(r)
>print(M1*M2)
Program-
# DEFINING VECTOR
> a=c(23,84,16,95,23,6,41,29,6,4,6)
#1.MEAN-
> print(mean(a))
#2.MEDIAN-
> print(median(a))
#3.MODE-
# Return the most frequent value (the statistical mode) of a vector.
#
# a: an atomic vector.
# Returns the single value that occurs most often in `a`. When several
# values are tied, the one that appears first in `a` is returned, because
# unique() keeps first-appearance order and which.max() picks the first
# maximum.
getmode <- function(a) {
  uniqv <- unique(a)
  # match() maps each element to its position in uniqv; tabulate() then
  # counts how many times each position (i.e. each distinct value) occurs.
  uniqv[which.max(tabulate(match(a, uniqv)))]
}
> print(getmode(a))
#4.STANDARD DEVIATION-
> print(sd(a))
Sample Output-
OBJECTIVE- To perform data pre-processing operations: (1) Handle missing data (2)
Min-Max normalization
Program-
# Handle Missing Data-
# First example: a vector whose gaps are all NA; is.na() flags each of them.
x <- c(NA, 3, 4, NA, NA, NA)
is.na(x)
# Second example: 0 / 0 evaluates to NaN, which is.na() also reports as
# missing. The elements must be comma-separated ("3 4" is a syntax error).
x <- c(NA, 3, 4, NA, NA, 0 / 0, 0 / 0)
#Min-Max Normalization-
install.packages("caret")
library(caret)
# Sample data frame (7 rows, 3 numeric columns) for the min-max
# normalization demo.
# NOTE(review): Var3 previously read "0-15", "0-12" and "0·85". The middle
# dot is a syntax error and the hyphens look like the same garbled decimal
# point, so the values are restored as 0.15, 0.12 and 0.85 - confirm against
# the original lab sheet.
data <- data.frame(
  Var1 = c(120, 345, 145, 522, 596, 285, 21),
  Var2 = c(10, 15, 45, 22, 53, 28, 12),
  Var3 = c(-34, 0.05, 0.15, 0.12, -6, 0.85, 0.11)
)
>summary (Normalized_My_Data)
Program-
> data("USArrests")
> rawdf <- na.omit(USArrests)
> names(arrests.pca)
> print(arrests.pca)
> summary(arrests.pca)
> pcaCharts(arrests.pca)
Sample Output-
Program-
# Input data
x <- c(1, 2, 3, 4, 5)
y <- c(2, 4, 5, 4, 5)
# Fit a linear regression model
Sample Output-
Program-
# Install and load necessary packages
# requireNamespace() only checks whether a package is installed, without
# attaching it; library() then attaches it and stops with an error if it is
# still unavailable, instead of returning FALSE the way require() does.
if (!requireNamespace("caTools", quietly = TRUE)) {
  install.packages("caTools")
}
if (!requireNamespace("ggplot2", quietly = TRUE)) {
  install.packages("ggplot2")
}
library(caTools)
library(ggplot2)
data <- read.csv("/gender_submission.csv")
# Plot the logistic regression curve - the original plot may not be
# relevant
# Plotting 'Survived' against itself for demonstration.
import numpy as np
import pandas as pd
# Load dataset
data = pd.read_csv('/content/Groceries_dataset.csv')
data.drop_duplicates(inplace=True)
data.isnull().sum()
if 'Date' in data.columns:
    # Split the date into calendar parts, one new column per part.
    # NOTE(review): the .dt accessor needs a datetime-like column - confirm
    # that 'Date' is converted (e.g. with pd.to_datetime) before this point.
    data['year'] = data['Date'].dt.year
    data['month'] = data['Date'].dt.month
    data['day'] = data['Date'].dt.day
    data['day_name'] = data['Date'].dt.day_name()
# Convert to integer
item_count_pivot = item_count_pivot.astype('int32')
# Apriori Algorithm
basket = item_count.groupby('Transaction')['itemDescription'].apply(list).reset_index()
basket_encoded = basket['itemDescription'].str.join('|').str.get_dummies('|')
frequent_itemsets.sort_values('support', ascending=False).head(10)
Program-
# Install the clustering packages only when they are missing, then attach
# them. Package names must be in plain ASCII quotes; typographic quotes are a
# syntax error. "stats" ships with base R and cannot be installed from CRAN,
# so it is only attached.
for (pkg in c("cluster", "ClusterR")) {
  if (!requireNamespace(pkg, quietly = TRUE)) {
    install.packages(pkg)
  }
}
library(stats)
library(cluster)
library(ClusterR)
> kmeans.re
> kmeans.re$cluster
> cm
+ col = kmeans.re$cluster)
> kmeans.re$centers
+ y_kmeans,
+ lines = 0,
+ shade = TRUE,
+ color = TRUE,
+ labels = 2,
+ plotchar = FALSE,
+ span = TRUE,
+ xlab = 'Sepal.Length',
+ ylab = 'Sepal.Width')
Sample Output-