0% found this document useful (0 votes)

17 views · 4 pages

HW 1 Math 380 R Code

This document contains R code that performs various exploratory data analyses and statistical summaries on pizza delivery data. The code loads CSV data, calculates summary statistics like means, medians, and quartiles, creates plots like histograms, bar plots, box plots, and QQ plots to visualize distributions and outliers, and groups and summarizes delivery time data. Overall, the code conducts a comprehensive exploratory analysis to understand patterns in pizza delivery times and temperatures.

Uploaded by

Tyrome Madkins

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

17 views · 4 pages

HW 1 Math 380 R Code

Uploaded by

Tyrome Madkins

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1 / 4

# 2.6
# (a) Base-graphics histogram of the pizza temperature with a dashed
# reference line at 65 degrees.

# Set the working directory to the folder that holds the data file.
# NOTE(review): hard-coded, machine-specific path; adjust before running
# this script on another machine.
setwd("C:/Users/tyrom/OneDrive/Documents")

# Read the CSV data
pizza_data <- read.csv("pizza_delivery.csv")

# Extract the temperature data
temperature <- pizza_data$temperature

# Create a histogram; freq = FALSE puts densities (not counts) on the y-axis
hist(temperature, col = "yellow", main = "Pizza Temperature", freq = FALSE)

# Add a dashed vertical line at 65 degrees. abline(v = ) always spans the
# full plot region, so no y-range has to be guessed for the density scale.
abline(v = 65, lty = 2, col = "blue")

# 2.6
# (b) The temperature histogram again, this time drawn with ggplot2.

# Point R at the folder that contains the data file
setwd("C:/Users/tyrom/OneDrive/Documents")

# Load the delivery records
pizzadelivery <- read.csv("pizza_delivery.csv")

# ggplot2 supplies ggplot(), geom_histogram(), labs() and the scale helpers
library(ggplot2)

# Histogram with 2.5-wide bins outlined in dark grey. The y-axis is titled
# "Frequency", limited to 0-200 and ticked every 10 units.
ggplot(pizzadelivery, aes(x = temperature)) +
  geom_histogram(binwidth = 2.5, colour = "darkgrey") +
  labs(y = "Frequency") +
  scale_y_continuous(
    name = "Frequency",
    limits = c(0, 200),
    breaks = seq(from = 0, to = 200, by = 10)
  )

# 2.6
# (c) Bar plot of the number of deliveries made by each driver.

# Point R at the folder that contains the data file
setwd("C:/Users/tyrom/OneDrive/Documents")

# Load the delivery records
pizza_data <- read.csv("pizza_delivery.csv")

# Pull out the driver column
driver <- pizza_data$driver

# table() counts the rows per driver; barplot() draws one bar per count
barplot(
  height = table(driver),
  col = "green",
  xlab = "Delivery Driver",
  ylab = "Number of Deliveries"
)

# 2.6
# (d) Bar chart of deliveries per driver, with each bar split (filled) by
# the day of the week.

# Set the working directory
setwd("C:/Users/tyrom/OneDrive/Documents")

# Read the CSV file
pizzadelivery <- read.csv("pizza_delivery.csv")

# Load the ggplot2 library
library(ggplot2)

# Fill colour for each day of the week; the names also define the day order
gray_colors <- c(
  "Monday" = "gray10",
  "Tuesday" = "gray20",
  "Wednesday" = "gray30",
  "Thursday" = "gray40",
  "Friday" = "gray50",
  "Saturday" = "gray60",
  "Sunday" = "gray70"
)

# Turn "day" into a factor whose levels run in reverse weekday order
# (Sunday first, Monday last)
pizzadelivery$day <- factor(pizzadelivery$day, levels = rev(names(gray_colors)))

# Create the bar chart. ggplot() + geom_bar() replaces the deprecated qplot();
# geom_bar() counts the rows per driver/day combination, as
# qplot(geom = "bar") did.
ggplot(pizzadelivery, aes(x = driver, fill = day)) +
  geom_bar() +
  labs(x = "Driver", y = "Number of Deliveries") +
  scale_fill_manual(values = gray_colors) +
  theme_bw()

# 3.1
# Data sets: ten observations each of distance and altitude.
distance <- c(12.5, 29.9, 14.8, 18.7, 7.6, 16.2, 16.5, 27.4, 12.1, 17.5)
altitude <- c(342, 1245, 502, 555, 398, 670, 796, 912, 238, 466)

# (a) Calculate the arithmetic mean and median for both distance and altitude.
mean_distance <- mean(distance)
median_distance <- median(distance)
mean_altitude <- mean(altitude)
median_altitude <- median(altitude)

# Print results
cat("Distance Mean:", mean_distance, "\n")
cat("Distance Median:", median_distance, "\n")
cat("Altitude Mean:", mean_altitude, "\n")
cat("Altitude Median:", median_altitude, "\n")

# (b) Determine the first and third quartiles for both distance and altitude.
# type = 2 selects the inverse empirical distribution function with
# averaging at discontinuities.
quartiles_distance <- quantile(distance, probs = c(0.25, 0.75), type = 2)
quartiles_altitude <- quantile(altitude, probs = c(0.25, 0.75), type = 2)

# Print results
cat("Distance Quartiles (Q1, Q3):", quartiles_distance[1], ",",
    quartiles_distance[2], "\n")
cat("Altitude Quartiles (Q1, Q3):", quartiles_altitude[1], ",",
    quartiles_altitude[2], "\n")

# (c) Calculate the interquartile range (IQR), absolute median deviation, and
# standard deviation for both variables.
# The absolute median deviation is computed as the mean absolute deviation
# around the median, i.e. mean(|x - median(x)|). stats::mad() is deliberately
# not used: with its default constant it returns
# 1.4826 * median(|x - median(x)|), a scaled estimate of the standard
# deviation rather than a plain absolute deviation.
iqr_distance <- diff(quartiles_distance)
amd_distance <- mean(abs(distance - median(distance)))
sd_distance <- sd(distance)

iqr_altitude <- diff(quartiles_altitude)
amd_altitude <- mean(abs(altitude - median(altitude)))
sd_altitude <- sd(altitude)

# Print Results
cat("Distance IQR:", iqr_distance, "\n")
cat("Altitude IQR:", iqr_altitude, "\n")
cat("Distance Absolute Median Deviation:", amd_distance, "\n")
cat("Altitude Absolute Median Deviation:", amd_altitude, "\n")
cat("Distance Standard Deviation:", sd_distance, "\n")
cat("Altitude Standard Deviation:", sd_altitude, "\n")

# (e) Draw and interpret the box plot for both distance and altitude.
boxplot(distance, main = "Box Plot - Distance", ylab = "Distance")
boxplot(altitude, main = "Box Plot - Altitude", ylab = "Altitude")

# (f) Summarize grouped data for distance and calculate the weighted arithmetic
# mean and median.
# Class boundaries: Short = [5, 15], Moderate = (15, 20], Long = (20, 30].
class_breaks <- c(5, 15, 20, 30)
grouped_data <- data.frame(
  Distance_Group = c("Short", "Moderate", "Long"),
  Frequency = c(
    sum(distance >= class_breaks[1] & distance <= class_breaks[2]),
    sum(distance > class_breaks[2] & distance <= class_breaks[3]),
    sum(distance > class_breaks[3] & distance <= class_breaks[4])
  )
)

# Calculate the weighted mean for distance: each class is represented by its
# midpoint, weighted by the class frequency.
midpoints <- (class_breaks[-length(class_breaks)] + class_breaks[-1]) / 2
total_frequency <- sum(grouped_data$Frequency)
weighted_mean_distance <- sum(midpoints * grouped_data$Frequency) / total_frequency

# Calculate the weighted median for distance (assuming equal distribution within
# each class): locate the first class whose cumulative frequency reaches half
# of the observations, then interpolate linearly inside that class:
#   lower bound + (n / 2 - frequency below the class) / class frequency * width
cumulative_frequency <- cumsum(grouped_data$Frequency)
median_class <- which(cumulative_frequency >= total_frequency / 2)[1]
frequency_below <- cumulative_frequency[median_class] -
  grouped_data$Frequency[median_class]
class_width <- class_breaks[median_class + 1] - class_breaks[median_class]
weighted_median_distance <- class_breaks[median_class] +
  (total_frequency / 2 - frequency_below) /
    grouped_data$Frequency[median_class] * class_width

# Print results
cat("Weighted Mean for Distance:", weighted_mean_distance, "\n")
cat("Weighted Median for Distance:", weighted_median_distance, "\n")

# 3.10
# Point R at the folder that contains the data file
setwd("C:/Users/tyrom/OneDrive/Documents")

# Load the delivery records
pizzadelivery <- read.csv("pizza_delivery.csv")

# (a) Per-column summary statistics for the whole data set
summary(pizzadelivery)

# (b) 99% quantiles of the delivery time and of the temperature
quantile(x = pizzadelivery$time, probs = 0.99)
quantile(x = pizzadelivery$temperature, probs = 0.99)

# (c) Absolute mean deviation: the average absolute distance of the values
# in `data` from their arithmetic mean.
absolute_mean_deviation <- function(data) {
  deviations <- data - mean(data)
  mean(abs(deviations))
}

# Absolute mean deviation of the pizza temperature (stored, then printed)
abs_mean_deviation_temperature <- absolute_mean_deviation(
  pizzadelivery$temperature
)
abs_mean_deviation_temperature

# (d) Standardise the delivery time with scale(), then show the mean and
# variance of the scaled values
scaled_delivery_time <- scale(pizzadelivery$time)
mean(scaled_delivery_time)
var(scaled_delivery_time)

# (e) Box plots of delivery time and temperature; outline = FALSE keeps the
# outlying points from being drawn
boxplot(pizzadelivery$time, outline = FALSE)
boxplot(pizzadelivery$temperature, outline = FALSE)

# (f) Mean delivery time within 10-minute delivery-time classes.
# Had to install the dplyr package to better handle the "NAs by coercion"
# error received in earlier tries; it seems to be either an issue with
# conversion or missing data values.

# Load the dplyr library
library(dplyr)

# Create a new variable for delivery time in steps of 10 min.
# na.rm = TRUE keeps a single missing delivery time from turning the upper
# break into NA, which would make seq() fail.
pizzadelivery$TimeInSteps <- cut(
  pizzadelivery$time,
  breaks = seq(0, max(pizzadelivery$time, na.rm = TRUE) + 10, by = 10)
)

# Calculate the mean delivery time per 10-minute class using dplyr
result <- pizzadelivery %>%
  group_by(TimeInSteps) %>%
  summarize(MeanDeliveryTime = mean(time, na.rm = TRUE))

# Print the result
result

# (g) Normal QQ-plots, each with its reference line, for the delivery time
# and then for the temperature

# Delivery time
qqnorm(y = pizzadelivery$time)
qqline(y = pizzadelivery$time)

# Temperature
qqnorm(y = pizzadelivery$temperature)
qqline(y = pizzadelivery$temperature)

Verzani Answers
100% (8)
Verzani Answers
94 pages
Modern Statistics With R
100% (3)
Modern Statistics With R
580 pages
RapidMiner Data Engineering Professional Certification Exam Quiz Answers
No ratings yet
RapidMiner Data Engineering Professional Certification Exam Quiz Answers
8 pages
MHS2 Update Instruction
100% (1)
MHS2 Update Instruction
9 pages
How To Install Aloha On Windows 7 Server 2008
No ratings yet
How To Install Aloha On Windows 7 Server 2008
3 pages
PC Troubleshooting I Syllabus
100% (2)
PC Troubleshooting I Syllabus
6 pages
Project1 - Cold Storage Case Study
No ratings yet
Project1 - Cold Storage Case Study
11 pages
7 K-Means Clustering
No ratings yet
7 K-Means Clustering
27 pages
Lab File AD PDF
No ratings yet
Lab File AD PDF
25 pages
Codigo R Diamantes
No ratings yet
Codigo R Diamantes
5 pages
Chapter 2. Pre-Processing Data
No ratings yet
Chapter 2. Pre-Processing Data
37 pages
R Program
No ratings yet
R Program
22 pages
BAN5
No ratings yet
BAN5
2 pages
Tài Liệu Không Có Tiêu Đề
No ratings yet
Tài Liệu Không Có Tiêu Đề
7 pages
R Record-1
No ratings yet
R Record-1
57 pages
R Programming
No ratings yet
R Programming
9 pages
Analysis Using Statistical: Introduction & Data Exploration
No ratings yet
Analysis Using Statistical: Introduction & Data Exploration
23 pages
Shahun Term Workr1
No ratings yet
Shahun Term Workr1
34 pages
R Note
No ratings yet
R Note
56 pages
R File Code
No ratings yet
R File Code
16 pages
Lab Manual - DSR
No ratings yet
Lab Manual - DSR
32 pages
R Code
No ratings yet
R Code
9 pages
ML Project - Jupyter Notebook
No ratings yet
ML Project - Jupyter Notebook
5 pages
Problem Set 3: General Guideline
No ratings yet
Problem Set 3: General Guideline
12 pages
Ismaykim1 PDF
No ratings yet
Ismaykim1 PDF
522 pages
Rstudio Study Notes For PA 20181126
No ratings yet
Rstudio Study Notes For PA 20181126
6 pages
Practice-Training BTTC
No ratings yet
Practice-Training BTTC
25 pages
Cluster R
No ratings yet
Cluster R
1 page
Dav Exp8
No ratings yet
Dav Exp8
10 pages
R Graphics Essentials For Great Data Visualization
No ratings yet
R Graphics Essentials For Great Data Visualization
28 pages
Hierar Varam
No ratings yet
Hierar Varam
11 pages
R Workshop Material 18-19, Oct-2023
No ratings yet
R Workshop Material 18-19, Oct-2023
67 pages
R Doc Ii Vee
No ratings yet
R Doc Ii Vee
24 pages
Mini Project - Cold Storage Case Study
No ratings yet
Mini Project - Cold Storage Case Study
8 pages
R Programming
No ratings yet
R Programming
11 pages
SML Practical 1to11
No ratings yet
SML Practical 1to11
23 pages
Commands For Data Analysis Using R
No ratings yet
Commands For Data Analysis Using R
11 pages
07C LineOfBestFit
No ratings yet
07C LineOfBestFit
10 pages
Week2 Cheat Sheet Data Wrangling With Tidyverse
No ratings yet
Week2 Cheat Sheet Data Wrangling With Tidyverse
4 pages
11 RIC Journal
No ratings yet
11 RIC Journal
46 pages
Lab Wk1soln PDF
No ratings yet
Lab Wk1soln PDF
14 pages
Projet - COLD STORAGE
No ratings yet
Projet - COLD STORAGE
21 pages
EDAV
No ratings yet
EDAV
218 pages
Lesllie Salt Company
No ratings yet
Lesllie Salt Company
15 pages
Notas
No ratings yet
Notas
19 pages
Copy Entire Document Content in R Studio
No ratings yet
Copy Entire Document Content in R Studio
17 pages
F24 Lab-01
No ratings yet
F24 Lab-01
4 pages
Bda Skill
No ratings yet
Bda Skill
34 pages
Stastistics and Probability With R Programming Language: Lab Report
50% (2)
Stastistics and Probability With R Programming Language: Lab Report
44 pages
Lab 2
No ratings yet
Lab 2
5 pages
R Session - Note2 - Updated
No ratings yet
R Session - Note2 - Updated
7 pages
Copy Entire Document Content in R Studio: R Script Compiled by Mr. Anup Sharma (Strictly To Be Used As Class Notes)
No ratings yet
Copy Entire Document Content in R Studio: R Script Compiled by Mr. Anup Sharma (Strictly To Be Used As Class Notes)
15 pages
Notes-US Census Data
No ratings yet
Notes-US Census Data
12 pages
HWK2 324 SS
100% (1)
HWK2 324 SS
7 pages
Content: Dplyr, Readr, TM, Ggplot2/+ggforce/, Tidyr, Broom Dplyr
No ratings yet
Content: Dplyr, Readr, TM, Ggplot2/+ggforce/, Tidyr, Broom Dplyr
8 pages
Recipes For Data Processing
No ratings yet
Recipes For Data Processing
51 pages
Business Analytics Unit - IV Notes - 60637706 - 2025 - 05!15!02 - 16
No ratings yet
Business Analytics Unit - IV Notes - 60637706 - 2025 - 05!15!02 - 16
28 pages
Practical Assignment-10 Mini Project Nutrition Calculator - Calculate Nutrition For Recipes
No ratings yet
Practical Assignment-10 Mini Project Nutrition Calculator - Calculate Nutrition For Recipes
16 pages
Leer
No ratings yet
Leer
19 pages
Praktikum Modul 3
No ratings yet
Praktikum Modul 3
5 pages
Manipulating Data in R
No ratings yet
Manipulating Data in R
32 pages
R
No ratings yet
R
6 pages
Project Report PDF
100% (1)
Project Report PDF
37 pages
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
From Everand
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
Manish Soni
No ratings yet
Function
No ratings yet
Function
18 pages
QmEye PC Client Introduction
No ratings yet
QmEye PC Client Introduction
16 pages
Big Data: Characteristics
No ratings yet
Big Data: Characteristics
4 pages
4g CDR New Site Mocn 12jkb0166 in - Rsudcengkareng - Ae (20221006) - Swap H3i
No ratings yet
4g CDR New Site Mocn 12jkb0166 in - Rsudcengkareng - Ae (20221006) - Swap H3i
45 pages
SQL Functions: Assignments Q
No ratings yet
SQL Functions: Assignments Q
4 pages
Roubleshooting Percona XtraDB Cluster
No ratings yet
Roubleshooting Percona XtraDB Cluster
4 pages
Dictionary of Computer Acronyms and Abbreviations B
No ratings yet
Dictionary of Computer Acronyms and Abbreviations B
10 pages
Ecs4100 12ph
No ratings yet
Ecs4100 12ph
6 pages
05 Generics
No ratings yet
05 Generics
116 pages
xps-13-l321x-mlk - Reference Guide - En-Us
No ratings yet
xps-13-l321x-mlk - Reference Guide - En-Us
22 pages
Design Patterns For Blockchain-Based Self-Sovereign Identity - European Conference On Pattern Languages of Programs
No ratings yet
Design Patterns For Blockchain-Based Self-Sovereign Identity - European Conference On Pattern Languages of Programs
15 pages
DROBO B810i+Getting+Started+Guide
No ratings yet
DROBO B810i+Getting+Started+Guide
33 pages
Huzzaz
No ratings yet
Huzzaz
24 pages
Health Monitoring Using Internet of Things (Iot)
No ratings yet
Health Monitoring Using Internet of Things (Iot)
5 pages
A Case Study of Sony Interactive Entertainment
No ratings yet
A Case Study of Sony Interactive Entertainment
6 pages
User Manual Tsi Bravo 120vac v3 4
No ratings yet
User Manual Tsi Bravo 120vac v3 4
37 pages
RST Instruments: C109 Pneumatic Readout Instruction Manual
No ratings yet
RST Instruments: C109 Pneumatic Readout Instruction Manual
25 pages
Zimbra MigrationWizard For Exchange
No ratings yet
Zimbra MigrationWizard For Exchange
24 pages
6th International Conference On Cloud Computing and IoT (CCCIoT 2025)
No ratings yet
6th International Conference On Cloud Computing and IoT (CCCIoT 2025)
2 pages
Think Project User Manual
No ratings yet
Think Project User Manual
50 pages
SRS Tun DR Ismail College (Ktdi) Online Venue Booking System
No ratings yet
SRS Tun DR Ismail College (Ktdi) Online Venue Booking System
35 pages
SC 900
No ratings yet
SC 900
8 pages
8085 ALP Five ALP To Count Even or and Odd Data Byte
No ratings yet
8085 ALP Five ALP To Count Even or and Odd Data Byte
5 pages
CMS3.0 User Manual
No ratings yet
CMS3.0 User Manual
29 pages
AWS Certified Developer - Associate Exam Dumps With PDF and VCE Download (91-120)
No ratings yet
AWS Certified Developer - Associate Exam Dumps With PDF and VCE Download (91-120)
9 pages
Configuring A Payment Method in SAP
No ratings yet
Configuring A Payment Method in SAP
3 pages

HW 1 Math 380 R Code

Uploaded by

HW 1 Math 380 R Code

Uploaded by

# 2.

# Read the CSV data

# Extract the temperature data

# Add a vertical line at 65 degrees

# Read the CSV data

# Load the ggplot2 library

# Create a histogram plot

# Read the CSV data

# Extract the driver variable

# Create a barplot to visualize the number of deliveries by driver

# (d) Set the working directory

# Read the CSV file

# Load the ggplot2 library

# Reorder the levels of the "day" variable in descending order

# Create the bar chart using qplot

# Altitude IQR: second entry of quartiles_altitude minus the first
iqr_altitude <- quartiles_altitude[2] - quartiles_altitude[1]

# Calculate the weighted mean for distance

# Read the CSV data

# (a) Calculate summary statistics

# (c) Function to calculate absolute mean deviation

# Calculate absolute mean deviation of temperature

# Load the dplyr library

# Create a new variable for delivery time in steps of 10 min

# Calculate the mean using dplyr

# Print the result

# (g) QQ-plot for DeliveryTime and Temperature

You might also like