0% found this document useful (0 votes)

56 views3 pages

RG Inference Code

This document contains code for analyzing a dataset on restaurant marketing campaigns. It loads and cleans the data, checks for missing values and duplicates. It then generates summary statistics, histograms, and bar plots to visualize metrics like pageviews, calls and reservations across treatment groups and restaurant types. Statistical tests like ANOVA and normality tests are also performed to analyze relationships between variables and check distributions. Results are exported to text and image files for reporting.

Uploaded by

Brokin Hart

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

56 views3 pages

RG Inference Code

Uploaded by

Brokin Hart

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

# Author: Shovan Chowdhury

# ---- Reading the data set ----
# NOTE(review): both the reader function and the file name were replaced by
# "[Link]" when this script was extracted. read.csv() is the presumed original
# reader (the call passes `header`); confirm. The file-name placeholder inside
# the path is left untouched and must be replaced with the real file name.
d <- read.csv(
  "D:/business analytics/eMDP_BA/EDA_session/RG case/[Link]",
  header = TRUE
)

# attach() is retained only because the rest of this script refers to the
# columns (pageviews, calls, reservations, treatment, restaurant_type,
# business_id) by bare name.
attach(d)
names(d)

## Check the type of all the columns of the data frame.
## (The original inspected `appcab`, which is never defined in this script.)
str(d)

## --------------- Data Cleaning and Data Validation ------------------- ##

## Look for duplicate values in the business_id column, as it is the
## primary key.
sum(duplicated(d)) # number of fully duplicated rows in the data frame
sum(duplicated(business_id)) # repeated primary-key values (author found none)

## Look for NA values and missing/blank values in all the columns.
# NOTE(review): the three calls here were garbled to "[Link](d)" during
# extraction. is.na() is the presumed original for the first two; the third
# could not be recovered, so a per-column NA count is used in its place --
# confirm against the original script.
is.na(d)
sum(is.na(d))
colSums(is.na(d))

## Checking for blank ("") values in all the columns of the data frame;
## the author reports there are none.
# vapply() pins the result to one integer per column; na.rm = TRUE ignores NA
# comparisons, matching the original length(which(...)) count.
vapply(d, function(x) sum(x == "", na.rm = TRUE), integer(1))

# ------------ Exporting results to a text file ----------
# NOTE(review): the output file names were replaced by "[Link]" during
# extraction; both paths below currently end in the same placeholder and must
# be given their real (distinct) file names before running.
sink("D:/business analytics/eMDP_BA/EDA_session3/RG case/[Link]")

# print() is explicit so the summaries reach the sink even when the script is
# run through source(), which does not auto-print top-level values.
print(summary(pageviews[treatment == 0]))
print(summary(pageviews[restaurant_type == "chain"]))
print(summary(pageviews[treatment == 2 & restaurant_type == "chain"]))
sink() # stop diverting output

# ------------ Exporting histograms to an image file ----------
jpeg("D:/business analytics/eMDP_BA/EDA_session3/RG case/[Link]")

# One row, three panels: pageviews for each treatment group.
par(mfrow = c(1, 3))
hist(pageviews[treatment == 0])
hist(pageviews[treatment == 1])
hist(pageviews[treatment == 2])
dev.off() # close the jpeg device so the file is written

# ---------------- Bar plots with respect to treatments -----------------
treatment_labels <- c("Control", "Treatment 1", "Treatment 2")
treatment_cols <- c("red", "blue", "green")

# Mean of each outcome per treatment group.
tab_1 <- tapply(pageviews, treatment, mean)
tab_2 <- tapply(calls, treatment, mean)
tab_3 <- tapply(reservations, treatment, mean)

barplot(tab_1, col = treatment_cols, xlab = "Page Views",
        names.arg = treatment_labels)
barplot(tab_2, col = treatment_cols, xlab = "Calls",
        names.arg = treatment_labels)
barplot(tab_3, col = treatment_cols, xlab = "Reservations",
        names.arg = treatment_labels)

# ---------- Bar plots with respect to treatments and restaurant type ----------
# Mean of each outcome per (treatment, restaurant_type) cell; rows are
# treatments, columns are restaurant types.
tab_4 <- tapply(pageviews, list(treatment, restaurant_type), mean)
tab_5 <- tapply(calls, list(treatment, restaurant_type), mean)
tab_6 <- tapply(reservations, list(treatment, restaurant_type), mean)

# beside = TRUE draws one cluster per restaurant type; the three colours are
# recycled across clusters, giving the same red/blue/green pattern as the
# original six-element colour vector.
barplot(tab_4, beside = TRUE, col = treatment_cols, xlab = "Page Views")
barplot(tab_5, beside = TRUE, col = treatment_cols, xlab = "Calls")
barplot(tab_6, beside = TRUE, col = treatment_cols, xlab = "Reservations")

# ------- Confirmatory analysis ---------------------

# ANOVA
# Treat both grouping variables as factors so aov() fits group effects rather
# than a numeric slope.
TRT <- as.factor(treatment)
RT <- as.factor(restaurant_type)

# ---- One-way ANOVA models: outcome ~ treatment ----
mod_1 <- aov(pageviews ~ TRT)
summary(mod_1)
# TukeyHSD(mod_1)

mod_2 <- aov(calls ~ TRT)
summary(mod_2)
# TukeyHSD(mod_2)

mod_3 <- aov(reservations ~ TRT)
summary(mod_3)
# TukeyHSD(mod_3)

# ---- Two-way ANOVA models: main effects plus TRT:RT interaction ----
mod_4 <- aov(pageviews ~ TRT * RT)
summary(mod_4)
# TukeyHSD(mod_4)

mod_5 <- aov(calls ~ TRT * RT)
summary(mod_5)
# TukeyHSD(mod_5)

mod_6 <- aov(reservations ~ TRT * RT)
summary(mod_6)
# TukeyHSD(mod_6)

# ----- Binomial distribution ----------

dbinom(4, size = 4, prob = 0.2) # P(X = 4)

# P(X >= 2): add up the probability mass at 2, 3 and 4.
# dbinom() is vectorised, so no explicit loop is needed.
s <- sum(dbinom(2:4, size = 4, prob = 0.2))
s

# The same probability via the CDF: 1 - P(X <= 1)
1 - pbinom(1, 4, 0.2)

# -------- Poisson distribution ---------

dpois(5, lambda = 3) # P(X = 5)

ppois(10, 3) # P(X <= 10)

# ------- Normal/Gaussian distribution -----

pnorm(20, mean = 12, sd = 3.2, lower.tail = FALSE) # right tail area

pnorm(16, mean = 12, sd = 3.2, lower.tail = TRUE) # left tail area
qnorm(0.9, 12, 3.2) # inverse CDF (quantile): the 90th percentile

# ----- Normality check ------------------

# Q-Q plot of reservations against the normal distribution, with a reference
# line.
qqnorm(reservations)
qqline(reservations, col = "red", lwd = 3)

# Formal tests
# Shapiro-Wilk normality test (maximum sample size should be 5000); the
# author's preferred test.
shapiro.test(reservations)

# Anderson-Darling test (from the nortest package)
library(nortest)
ad.test(reservations)
# Same test restricted to calls for control-group chain restaurants.
ad.test(calls[treatment == 0 & restaurant_type == "chain"])

# ------------ One-sample mean tests ------------

# One-sided: H1 is that the mean of calls is greater than 35.
t.test(calls, alternative = "greater", mu = 35)

# Two-sided: H1 is that the mean of calls differs from 35.
t.test(calls, mu = 35)

# --------------- Two-sample test ----------------

# Compares the means of calls and reservations (null difference 0) and reports
# a 95% confidence interval.
t.test(calls, reservations, mu = 0, conf.level = 0.95)

DAV Practical 2
No ratings yet
DAV Practical 2
6 pages
R Programming
No ratings yet
R Programming
11 pages
Exp 8 - LM
No ratings yet
Exp 8 - LM
10 pages
ML Exp No 1
No ratings yet
ML Exp No 1
8 pages
Document
No ratings yet
Document
29 pages
Eda Document Longterm
No ratings yet
Eda Document Longterm
10 pages
EDA Report Week2
No ratings yet
EDA Report Week2
15 pages
Data Cleaning R
No ratings yet
Data Cleaning R
16 pages
Data Cleaning and EDA Techniques Guide
No ratings yet
Data Cleaning and EDA Techniques Guide
38 pages
Mastering Exploratory Data Analysis
No ratings yet
Mastering Exploratory Data Analysis
24 pages
DAP Writeups - Merged
No ratings yet
DAP Writeups - Merged
33 pages
Data Analytics Practical
No ratings yet
Data Analytics Practical
6 pages
EDA Basics: Python for Data Analysis
100% (1)
EDA Basics: Python for Data Analysis
30 pages
Preprocessing Code
No ratings yet
Preprocessing Code
11 pages
Data Cleaning
No ratings yet
Data Cleaning
28 pages
Unit 3-5 15 Marks
No ratings yet
Unit 3-5 15 Marks
8 pages
2 Business
No ratings yet
2 Business
13 pages
Deep Learning Ram
No ratings yet
Deep Learning Ram
21 pages
Unit 3-BA
No ratings yet
Unit 3-BA
31 pages
Exploratory Data Analysis-1
No ratings yet
Exploratory Data Analysis-1
10 pages
Advance Stats Assignment
No ratings yet
Advance Stats Assignment
18 pages
Dev Record Aids
No ratings yet
Dev Record Aids
24 pages
Naan Mudhalvan - Google Cloud Data Analytics
No ratings yet
Naan Mudhalvan - Google Cloud Data Analytics
33 pages
Marketing Analytics EDA Insights
No ratings yet
Marketing Analytics EDA Insights
42 pages
04 Data Cleaning in R
No ratings yet
04 Data Cleaning in R
36 pages
People Analytics InSEM
No ratings yet
People Analytics InSEM
11 pages
Eda Indepth
No ratings yet
Eda Indepth
19 pages
Analysis Using Statistical: Introduction & Data Exploration
No ratings yet
Analysis Using Statistical: Introduction & Data Exploration
23 pages
Data Cleaning Using R
No ratings yet
Data Cleaning Using R
5 pages
Exploratory Data Analysis
No ratings yet
Exploratory Data Analysis
19 pages
Unit 4 Notes
No ratings yet
Unit 4 Notes
20 pages
Assignment 2 - Factor Hair
No ratings yet
Assignment 2 - Factor Hair
39 pages
R Functions
No ratings yet
R Functions
8 pages
Data Analysis With R
No ratings yet
Data Analysis With R
72 pages
Practical 1 EDA
No ratings yet
Practical 1 EDA
14 pages
EDA Guide for Data Scientists
No ratings yet
EDA Guide for Data Scientists
22 pages
Python Data Analysis with Numpy & Pandas
No ratings yet
Python Data Analysis with Numpy & Pandas
3 pages
BT1101 Tutorial 3 Part 2
No ratings yet
BT1101 Tutorial 3 Part 2
38 pages
Some Exercises
No ratings yet
Some Exercises
9 pages
QYB - Set Analysis and AGGR Exercises
No ratings yet
QYB - Set Analysis and AGGR Exercises
15 pages
INDEX
No ratings yet
INDEX
16 pages
Guidebook On Exploratory Data Analysis
No ratings yet
Guidebook On Exploratory Data Analysis
27 pages
Part 5
No ratings yet
Part 5
22 pages
Unit 1 DXV
No ratings yet
Unit 1 DXV
28 pages
Excel Data Analysis and Preprocessing Guide
No ratings yet
Excel Data Analysis and Preprocessing Guide
42 pages
Semi-Automated EDA in Python
No ratings yet
Semi-Automated EDA in Python
3 pages
Lesson 3. Data Preparation and Structuring 1 Data Cleaning
No ratings yet
Lesson 3. Data Preparation and Structuring 1 Data Cleaning
36 pages
Machine Learning Project Roadmap
No ratings yet
Machine Learning Project Roadmap
4 pages
R Studio: Scripts, Data Handling & Cleaning
No ratings yet
R Studio: Scripts, Data Handling & Cleaning
25 pages
Eda Lab Manual
No ratings yet
Eda Lab Manual
34 pages
Advanced R Data Analysis Training PDF
100% (1)
Advanced R Data Analysis Training PDF
72 pages
Business Analytics Notes
No ratings yet
Business Analytics Notes
8 pages
DS Exp4
No ratings yet
DS Exp4
4 pages
Machine Learning Transport Analysis
100% (5)
Machine Learning Transport Analysis
42 pages
Matrix, Dataframes, List
No ratings yet
Matrix, Dataframes, List
8 pages
Assessing Data Quality Dimensions
No ratings yet
Assessing Data Quality Dimensions
9 pages
Business Analytics Lab Manual
No ratings yet
Business Analytics Lab Manual
32 pages
FOUND. DATA SCIENCE Practical
No ratings yet
FOUND. DATA SCIENCE Practical
15 pages
Arima
No ratings yet
Arima
12 pages
L24 Quiz Group Meeting Biostatistics PDF
No ratings yet
L24 Quiz Group Meeting Biostatistics PDF
21 pages
STAT 203 Topic 1
No ratings yet
STAT 203 Topic 1
33 pages
Business Statistics End Term Exam (Set 1)
No ratings yet
Business Statistics End Term Exam (Set 1)
5 pages
Statistics and The Scientific Method
No ratings yet
Statistics and The Scientific Method
8 pages
Lapse Rate Analysis Report
No ratings yet
Lapse Rate Analysis Report
9 pages
Gujarati 5e PPT Ch01
100% (1)
Gujarati 5e PPT Ch01
21 pages
MATH 121 Chapter 8 Hypothesis Testing
No ratings yet
MATH 121 Chapter 8 Hypothesis Testing
31 pages
ML Notes (Module-3)
No ratings yet
ML Notes (Module-3)
21 pages
Sampling Distributions in Statistics
No ratings yet
Sampling Distributions in Statistics
17 pages
Econometrics Project
No ratings yet
Econometrics Project
17 pages
Lin RobustInferenceCox 1989
No ratings yet
Lin RobustInferenceCox 1989
6 pages
Math T STPM Sem 3 2018
No ratings yet
Math T STPM Sem 3 2018
2 pages
Mindmap QUANT - M6
No ratings yet
Mindmap QUANT - M6
1 page
Two Way Anova
No ratings yet
Two Way Anova
13 pages
Sufficient Sample Sizes in Multilevel Models
No ratings yet
Sufficient Sample Sizes in Multilevel Models
8 pages
Linear Regression Final Exam
No ratings yet
Linear Regression Final Exam
3 pages
Chapter 05 Generating Random Numbers
No ratings yet
Chapter 05 Generating Random Numbers
45 pages
Analyzed Univariate and Bivariate
No ratings yet
Analyzed Univariate and Bivariate
2 pages
Assignment 1 - ST36252 Testing of Hypothesis
No ratings yet
Assignment 1 - ST36252 Testing of Hypothesis
4 pages
Understanding Statistics and Data Analysis
No ratings yet
Understanding Statistics and Data Analysis
12 pages
Kruskal-Wallis Analysis of Feedback Attitudes
No ratings yet
Kruskal-Wallis Analysis of Feedback Attitudes
4 pages
Machine Learning Mid 1
No ratings yet
Machine Learning Mid 1
4 pages
MCA Question Bank
No ratings yet
MCA Question Bank
33 pages
International Journal of Agricultural and Statistical Sciences
No ratings yet
International Journal of Agricultural and Statistical Sciences
10 pages
Probability and Statistics Essentials
100% (1)
Probability and Statistics Essentials
353 pages
Intelligent Data Analysis: An Introduction
No ratings yet
Intelligent Data Analysis: An Introduction
4 pages
SPSS Uji PH
No ratings yet
SPSS Uji PH
16 pages
Least Squares & Kalman Filter Guide
No ratings yet
Least Squares & Kalman Filter Guide
17 pages
Demand Forecasting Techniques
No ratings yet
Demand Forecasting Techniques
32 pages

RG Inference Code

Uploaded by

RG Inference Code

Uploaded by

# Author: Shovan Chowdhury

# NOTE(review): everything from here down is a partial excerpt that repeats
# isolated statements from the full script earlier in this file; most
# statements are missing (e.g. the sink()/jpeg() calls below have no matching
# close here). "[Link]" marks tokens that were lost when the text was
# extracted; they are left exactly as found.

# Reading The data set

##---------------Data Cleaning and Data Validation

## Look for duplicate values in the business_id column as it is the primary key

sum(duplicated(d)) ## In the data frame

## Look for NA values and missing/blank values in all the columns

## Checking for blank values in all the columns of the dataframe

#------------exporting results in a text file----------

sink("D:/business analytics/eMDP_BA/EDA_session3/RG case/[Link]")

jpeg("D:/business analytics/eMDP_BA/EDA_session3/RG case/[Link]")

#---------------- Bar Plots with respect to treatments-----------------

# One-Way ANOVA Model

# Two-Way ANOVA Model

dbinom(4, size=4, prob=0.2) # P(X=4)

# can use CDF

pnorm(20, mean=12, sd=3.2, [Link]=FALSE) # right tail area

#------------mean test one sample------------

[Link](calls, alternative = "greater", mu = 35)

#---------------two samples test----------------

[Link](calls, reservations, mu = 0, [Link] = 0.95)

You might also like