0% found this document useful (0 votes)

262 views5 pages

Writing Efficient R Code

The document covers techniques for benchmarking and optimizing R code performance, including: 1) Measuring the read times of CSV and RDS files with system.time() and comparing them with microbenchmark(). 2) Using benchmarkme to check the RAM and CPU specs of the machine. 3) Timing growing a vector versus pre-allocating it, using system.time(). 4) Comparing vectorized operations such as multiplication and log-sums with for loops. 5) Using microbenchmark() to time selecting columns and rows from a data.frame versus a matrix.

Uploaded by

Octavio Flores

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

262 views5 pages

Writing Efficient R Code

Uploaded by

Octavio Flores

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 5

The Art of Benchmarking

R version
# Show the full description of the running R build
version

# Extract the major and minor release components from `version` by exact name
major <- version[["major"]]
minor <- version[["minor"]]

Comparing read times of CSV and RDS files

# Time a single read of the movies data from its CSV file
system.time(expr = read.csv(file = "movies.csv"))

# Time a single read of the movies data from its RDS file
system.time(expr = readRDS(file = "movies.rds"))

//3

Elapsed time
# Attach microbenchmark, which supplies the repeated-timing function used below
library(microbenchmark)

# Evaluate each reader 10 times and keep the collected timings in `compare`
compare <- microbenchmark(
  read.csv("movies.csv"),
  readRDS("movies.rds"),
  times = 10
)

# Display the timings
compare

//3

DataCamp hardware
# Attach benchmarkme, which supplies get_ram() and get_cpu()
library(benchmarkme)

# Store the amount of RAM on this machine as `ram` and the CPU specs as `cpu`
ram <- get_ram()
cpu <- get_cpu()

Benchmark DataCamp's machine

# Attach benchmarkme, which supplies benchmark_io()
library("benchmarkme")

# Run the benchmark a single time with size 5 and keep the result as `res`
res <- benchmark_io(size = 5, runs = 1)

# Plot the benchmark result
plot(x = res)

//2

Timings - growing a vector

# Problem size for the timing run. Defined here, with the same value the
# pre-allocation timing uses, so this snippet does not rely on `n` already
# existing in the session.
n <- 30000

# Use <- with system.time() to store the result as res_grow
# NOTE(review): growing() is not defined in this file; it is assumed to be
# available in the session.
system.time(res_grow <- growing(n))
Timings - pre-allocation
# Problem size for the timing run
n <- 30000

# Time pre_allocate(n); assigning with <- inside system.time() keeps the
# result as res_allocate
system.time(expr = res_allocate <- pre_allocate(n))

Vectorized code: multiplication

# Multiply x by itself element by element in one vectorized operation
# (no explicit loop). Store your answer as x2_imp
# NOTE(review): `x` is not defined in this snippet; assumed to be a numeric
# vector already present in the session.
x2_imp <- x * x

Vectorized code: calculating a log-sum

# Initial code: add up the log of each element of x one element at a time
n <- 100
total <- 0
x <- runif(n)
# seq_len(n) is empty when n is 0, whereas 1:n would iterate over c(1, 0)
for (i in seq_len(n)) {
  total <- total + log(x[i])
}

# Rewrite in a single line. Store the result in log_sum
# log() is applied to the whole vector at once and sum() adds the results
log_sum <- sum(log(x))

//4

Data frames and matrices - column selection

# Which is faster, mat[, 1] or df[, 1]?
# Times selecting the first column from each object.
# NOTE(review): `mat` and `df` are not defined in this file; presumably a
# matrix and a data frame holding the same data (confirm against the session).
microbenchmark(mat[, 1], df[, 1])

//2

Row timings
# Which is faster, mat[1, ] or df[1, ]?
# Times selecting the first row from each object.
# NOTE(review): `mat` and `df` are not defined in this file; presumably a
# matrix and a data frame holding the same data (confirm against the session).
microbenchmark(mat[1, ], df[1, ])

//2
//3

Profvis in action
# Attach profvis, which supplies the profvis() profiler
library(profvis)

# Profile every statement inside the braces
profvis({
  # Keep only the rows of movies whose Comedy column equals 1
  comedies <- movies[movies$Comedy == 1, ]

  # Scatter plot of rating against year
  plot(x = comedies$year, y = comedies$rating)

  # Fit a loess regression of rating on year, then compute the row order
  # that sorts the data by year
  model <- loess(formula = rating ~ year, data = comedies)
  j <- order(comedies$year)

  # Add the fitted values, in year order, to the plot as a red line
  lines(x = comedies$year[j], y = model$fitted[j], col = "red")
})

Change the data frame to a matrix

# Load the microbenchmark package
library(microbenchmark)
# The previous data frame solution.
# d() simulates six dice rolls: two independent sets of three draws from 1:6
# (with replacement), returned as a 3-row data frame with columns d1 and d2.
d <- function() {
  first_rolls <- sample(1:6, 3, replace = TRUE)
  second_rolls <- sample(1:6, 3, replace = TRUE)
  data.frame(d1 = first_rolls, d2 = second_rolls)
}

# The matrix solution.
# m() draws six values from 1:6 (with replacement) in a single call and
# arranges them into a matrix with two columns.
m <- function() {
  throws <- sample(1:6, 6, replace = TRUE)
  matrix(throws, ncol = 2)
}

# Use microbenchmark to time m() and d()
# Each expression is given a name so the two solutions can be told apart in
# the printed timings.

microbenchmark(
data.frame_solution = d(),
matrix_solution = m()
)

Calculating row sums

# Example data
rolls

# Define the previous solution
# app() returns the sum of each row of x, computed by having apply() call
# sum() on every row (margin 1).
app <- function(x) {
  apply(X = x, MARGIN = 1, FUN = sum)
}

# Define the new solution
# r_sum() returns the sum of each row of x using rowSums() directly.
r_sum <- function(x) {
  row_totals <- rowSums(x)
  row_totals
}

# Compare the methods
# Times app() against r_sum() on the same input.
# NOTE(review): `rolls` is not defined in this file; it is assumed to already
# exist in the session.

microbenchmark(
app_sol = app(rolls),
r_sum_sol = r_sum(rolls)
)

Use && instead of &

# Example data
is_double

# Define the previous solution
# move() tests the first three entries of is_double with the elementwise `&`
# operator. When all three are TRUE it assigns 11 to the local `current`;
# otherwise it does nothing.
move <- function(is_double) {
  three_doubles <- is_double[1] & is_double[2] & is_double[3]
  if (three_doubles) {
    current <- 11 # Go To Jail
  }
}

# Define the improved solution
# improved_move() tests the first three entries of is_double with the scalar
# `&&` operator, which stops evaluating as soon as one entry is FALSE. When
# all three are TRUE it assigns 11 to the local `current`; otherwise it does
# nothing.
improved_move <- function(is_double) {
  three_doubles <- is_double[1] && is_double[2] && is_double[3]
  if (three_doubles) {
    current <- 11 # Go To Jail
  }
}
## microbenchmark both solutions
## Each call is evaluated 1e5 times (the `times` argument).
## NOTE(review): `is_double` is not defined in this file; it is assumed to
## already exist in the session.
microbenchmark(move(is_double), improved_move(is_double), times = 1e5)

How many cores does this machine have?

# Attach the parallel package, which supplies detectCores()
library(parallel)

# Query the number of cores and keep it in the object no_of_cores
# (the arguments are spelled out at their default values)
no_of_cores <- detectCores(all.tests = FALSE, logical = TRUE)

# Show the stored value
no_of_cores

//2
//2
//3

Moving to parApply
# Report how many cores are available
detectCores()

# Start a cluster of 2 workers via makeCluster
cl <- makeCluster(spec = 2)

# Parallel version of apply(): run median() over margin 2 of dd on the cluster
parApply(cl = cl, X = dd, MARGIN = 2, FUN = median)

# Shut the cluster down
stopCluster(cl = cl)

Using parSapply()
library("parallel")

# Start a cluster of 2 workers via makeCluster
cl <- makeCluster(spec = 2)

# Export play() to the cluster so the workers can call it
clusterExport(cl = cl, varlist = "play")

# Parallel version of sapply(): call play() once for each index in 1:100
res <- parSapply(cl = cl, X = 1:100, FUN = function(i) play())

# Shut the cluster down
stopCluster(cl = cl)

Timings parSapply()
# Number of games to play in each timing run
no_of_games <- 1e5

## Time serial version; the result is kept as `serial`
system.time(
  expr = serial <- sapply(X = 1:no_of_games, FUN = function(i) play())
)

## Set up cluster: 4 workers, with play() exported to them
cl <- makeCluster(spec = 4)
clusterExport(cl = cl, varlist = "play")

## Time parallel version; the result is kept as `par`
system.time(
  expr = par <- parSapply(
    cl = cl,
    X = 1:no_of_games,
    FUN = function(i) play()
  )
)

## Stop cluster
stopCluster(cl = cl)

WHY NATIONS FAIL Chapter 4 (Summary and Reflections)
No ratings yet
WHY NATIONS FAIL Chapter 4 (Summary and Reflections)
15 pages
Chi09109 ch13
No ratings yet
Chi09109 ch13
41 pages
Jack Johnston, John DiNardo Econometric Methods, Fourth Edition PDF
75% (4)
Jack Johnston, John DiNardo Econometric Methods, Fourth Edition PDF
514 pages
Stock Watson 3U ExerciseSolutions Chapter8 Instructors
No ratings yet
Stock Watson 3U ExerciseSolutions Chapter8 Instructors
14 pages
Slides 2 Extending The RBC Model
No ratings yet
Slides 2 Extending The RBC Model
70 pages
Solutions
No ratings yet
Solutions
54 pages
Introduction To Econometrics 3rd Edition James H. Stock - Ebook PDF PDF Download
100% (4)
Introduction To Econometrics 3rd Edition James H. Stock - Ebook PDF PDF Download
46 pages
Modelo VECM para Series Financieras-1
No ratings yet
Modelo VECM para Series Financieras-1
30 pages
Basico 2 Examen Final Online (2) JETSTREAM (1) Victor Miyagui
No ratings yet
Basico 2 Examen Final Online (2) JETSTREAM (1) Victor Miyagui
4 pages
Exercise Solutions Chapter 2
No ratings yet
Exercise Solutions Chapter 2
29 pages
Exercises From Demmel Textbook
No ratings yet
Exercises From Demmel Textbook
1 page
Favar Package
No ratings yet
Favar Package
2 pages
Chapter 6: MATLAB Programs Exercises
No ratings yet
Chapter 6: MATLAB Programs Exercises
30 pages
Formula Sheet Mathematics 1 For Economics
No ratings yet
Formula Sheet Mathematics 1 For Economics
3 pages
Linear and Multiobjective Programming With Fuzzy Stochastic Extensions
No ratings yet
Linear and Multiobjective Programming With Fuzzy Stochastic Extensions
103 pages
Nikko New Product - Catalogue
No ratings yet
Nikko New Product - Catalogue
32 pages
Fudenberg and Tirole - Game Theory (Solutions Manual New)
No ratings yet
Fudenberg and Tirole - Game Theory (Solutions Manual New)
26 pages
CH 11
No ratings yet
CH 11
87 pages
Dokumen - Tips Cap 3 Bowers 1997 Actuarial Mathematics 2ed
No ratings yet
Dokumen - Tips Cap 3 Bowers 1997 Actuarial Mathematics 2ed
53 pages
Chapter 2 Jordi Gal I
No ratings yet
Chapter 2 Jordi Gal I
10 pages
Lecture 7 VAR, VECM and Multivariate Cointegration
No ratings yet
Lecture 7 VAR, VECM and Multivariate Cointegration
53 pages
Nicholson Microeconomics 7.3 7.7 Solutions
50% (2)
Nicholson Microeconomics 7.3 7.7 Solutions
4 pages
Microeconometría Bancaria
No ratings yet
Microeconometría Bancaria
62 pages
Multiple Regression Analysis, The Problem of Estimation
No ratings yet
Multiple Regression Analysis, The Problem of Estimation
53 pages
Growth Accounting Exercise PDF
No ratings yet
Growth Accounting Exercise PDF
2 pages
9662lsy PDF
No ratings yet
9662lsy PDF
361 pages
Financial Econometrics and Empirical Finance - Module 2 General Exam Solutions - July 2012
No ratings yet
Financial Econometrics and Empirical Finance - Module 2 General Exam Solutions - July 2012
25 pages
Chapter 7 Solutions
100% (1)
Chapter 7 Solutions
4 pages
Structural VAR and Applications: Jean-Paul Renne
No ratings yet
Structural VAR and Applications: Jean-Paul Renne
55 pages
Solutions To Problem Set 1: Theory of Banking - Academic Year 2016-17 Maria Bachelet February 24, 2017
No ratings yet
Solutions To Problem Set 1: Theory of Banking - Academic Year 2016-17 Maria Bachelet February 24, 2017
6 pages
Johansen Cointegration Test
No ratings yet
Johansen Cointegration Test
7 pages
Handout 15 DSGE Iris
No ratings yet
Handout 15 DSGE Iris
61 pages
Problem Set 2: Theory of Banking - Academic Year 2016-17
No ratings yet
Problem Set 2: Theory of Banking - Academic Year 2016-17
5 pages
Present Perfect Continuous
100% (1)
Present Perfect Continuous
22 pages
Department of Economics: ECONOMICS 481: Economics Research Paper and Seminar
No ratings yet
Department of Economics: ECONOMICS 481: Economics Research Paper and Seminar
15 pages
Chapter16 Distributed Lag Models
No ratings yet
Chapter16 Distributed Lag Models
30 pages
4 - LM Test and Heteroskedasticity
No ratings yet
4 - LM Test and Heteroskedasticity
13 pages
Assignment - 2 With Answer-1
No ratings yet
Assignment - 2 With Answer-1
7 pages
π=R R C Q Q Q Q: Practice problems on Module 3 (Markets) / Solutions to Questions 1 and 4
No ratings yet
π=R R C Q Q Q Q: Practice problems on Module 3 (Markets) / Solutions to Questions 1 and 4
2 pages
Econometrics I: TA Session 5: Giovanna Ubida
No ratings yet
Econometrics I: TA Session 5: Giovanna Ubida
20 pages
Micro Prelim Solutions
No ratings yet
Micro Prelim Solutions
32 pages
Weil Growth
No ratings yet
Weil Growth
72 pages
Multiple Regression Analysis: Inference: Wooldridge: Introductory Econometrics: A Modern Approach, 5e
No ratings yet
Multiple Regression Analysis: Inference: Wooldridge: Introductory Econometrics: A Modern Approach, 5e
23 pages
Harvard Economics 2020a Problem Set 4
100% (1)
Harvard Economics 2020a Problem Set 4
4 pages
Expression of Interest Bhushan - 1
No ratings yet
Expression of Interest Bhushan - 1
6 pages
Chiang/Wainwright: Fundamental Methods of Mathematical Economics Instructor S Manual
100% (2)
Chiang/Wainwright: Fundamental Methods of Mathematical Economics Instructor S Manual
5 pages
Stock Watson 3U ExerciseSolutions Chapter10 Students
100% (1)
Stock Watson 3U ExerciseSolutions Chapter10 Students
7 pages
Chap 20
No ratings yet
Chap 20
4 pages
Wiley - Student Solutions Manual To Accompany Introduction To Time Series Analysis and Forecasting - 978-0-470-43574-8
0% (1)
Wiley - Student Solutions Manual To Accompany Introduction To Time Series Analysis and Forecasting - 978-0-470-43574-8
3 pages
Course in Macroeconomics and Global Economics University of Rome 'Tor Vergata' Academic Year 2015/2016
No ratings yet
Course in Macroeconomics and Global Economics University of Rome 'Tor Vergata' Academic Year 2015/2016
5 pages
Cameron & Trivedi - Solution Manual Cap. 4-5
0% (1)
Cameron & Trivedi - Solution Manual Cap. 4-5
12 pages
ARCH Model
No ratings yet
ARCH Model
26 pages
Autocorrelation
100% (1)
Autocorrelation
172 pages
Stock Watson 4E Exercisesolutions Chapter14 Students PDF
No ratings yet
Stock Watson 4E Exercisesolutions Chapter14 Students PDF
7 pages
Turning Great Strategy Into Great Performance
100% (3)
Turning Great Strategy Into Great Performance
22 pages
Alternative To Profit Maximisation
No ratings yet
Alternative To Profit Maximisation
11 pages
Rhabdo Virus
No ratings yet
Rhabdo Virus
13 pages
Hayashi CH 1 Answers
No ratings yet
Hayashi CH 1 Answers
4 pages
University of Okara: Advertisement No. 2/2020
No ratings yet
University of Okara: Advertisement No. 2/2020
3 pages
Tax Invoice: 1046.17 Total Invoice Amount Rs
No ratings yet
Tax Invoice: 1046.17 Total Invoice Amount Rs
2 pages
Business and Economic Forecasting EMET3007/EMET8012 Problem Set 1
No ratings yet
Business and Economic Forecasting EMET3007/EMET8012 Problem Set 1
2 pages
Hyperbolic Absolute Risk Aversion (Final Presentation)
No ratings yet
Hyperbolic Absolute Risk Aversion (Final Presentation)
13 pages
Knitting Chapter
No ratings yet
Knitting Chapter
12 pages
Edraky - SD
No ratings yet
Edraky - SD
29 pages
EC744 Lecture Note 8 Applications of Stochastic DP: Prof. Jianjun Miao
No ratings yet
EC744 Lecture Note 8 Applications of Stochastic DP: Prof. Jianjun Miao
31 pages
Number System Representation - Study Notes
No ratings yet
Number System Representation - Study Notes
12 pages
Parallel Programming in R
100% (4)
Parallel Programming in R
14 pages
EC744 Lecture Note 3 Dynamic Programming Under Certainty: Prof. Jianjun Miao
No ratings yet
EC744 Lecture Note 3 Dynamic Programming Under Certainty: Prof. Jianjun Miao
17 pages
IELTS Simon Speaking Part 3 9dee133876
No ratings yet
IELTS Simon Speaking Part 3 9dee133876
37 pages
Cardiosync Corporate Business Plan
No ratings yet
Cardiosync Corporate Business Plan
7 pages
EC 744 Lecture Notes: Incomplete Markets and Bewley Models: Jianjun Miao
No ratings yet
EC 744 Lecture Notes: Incomplete Markets and Bewley Models: Jianjun Miao
39 pages
01-Sap Annual Report2023 Ang
No ratings yet
01-Sap Annual Report2023 Ang
119 pages
Introduction To TikTok Shop Affiliate Program
No ratings yet
Introduction To TikTok Shop Affiliate Program
10 pages
Introduction To Spark With Sparklyr in R
No ratings yet
Introduction To Spark With Sparklyr in R
11 pages
Econ 113 Probset3 Sol
No ratings yet
Econ 113 Probset3 Sol
7 pages
Movement in The Classroom
No ratings yet
Movement in The Classroom
7 pages
Chapter 3 Data Modeling Using The Entity Relationship ER Model
No ratings yet
Chapter 3 Data Modeling Using The Entity Relationship ER Model
55 pages
Multiple Regression Tutorial 3
100% (2)
Multiple Regression Tutorial 3
5 pages
Manual Slake Durability Device
No ratings yet
Manual Slake Durability Device
40 pages
Position Paper
No ratings yet
Position Paper
2 pages
Air Brake Rake Testing Procedure (LHB Coaches (2) - 0
No ratings yet
Air Brake Rake Testing Procedure (LHB Coaches (2) - 0
22 pages
Effectiveness of PPE Welding Presentation
No ratings yet
Effectiveness of PPE Welding Presentation
11 pages
Web Content Management System
No ratings yet
Web Content Management System
6 pages
CMAT - Module 3 Answer Key (QA - DI - LR)
No ratings yet
CMAT - Module 3 Answer Key (QA - DI - LR)
8 pages
Research Paper Mytsak
No ratings yet
Research Paper Mytsak
27 pages
Detailed Lesson Plan
No ratings yet
Detailed Lesson Plan
6 pages
Introduction To Interdisciplinary Studies 2nd Edition Repko Test Bank
100% (33)
Introduction To Interdisciplinary Studies 2nd Edition Repko Test Bank
8 pages
NTFK VOL 104 2 (3) 2017 - Henri Rikander - The Use of Electroshock Weapons by The Finnish Police 2016
No ratings yet
NTFK VOL 104 2 (3) 2017 - Henri Rikander - The Use of Electroshock Weapons by The Finnish Police 2016
34 pages
YouTube and You Learning in The Digital Age
No ratings yet
YouTube and You Learning in The Digital Age
7 pages
Scalable Data Processing in R
No ratings yet
Scalable Data Processing in R
8 pages
Visualizing Big Data With Trelliscope
No ratings yet
Visualizing Big Data With Trelliscope
7 pages
Supervised Learning in R Classification
No ratings yet
Supervised Learning in R Classification
7 pages
Wk08 Proforma Invoice Algeria 6.5
No ratings yet
Wk08 Proforma Invoice Algeria 6.5
1 page
Subdivision Warranty Bond
No ratings yet
Subdivision Warranty Bond
2 pages
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
From Everand
Oracle Certified Professional Java Programmer OCPJP 1Z0 809
Manish Soni
No ratings yet

Writing Efficient R Code

Uploaded by

Writing Efficient R Code

Uploaded by

The Art of Benchmarking

# Assign the variable major to the major component

# Assign the variable minor to the minor component

Comparing read times of CSV and RDS files

# How long does it take to read movies from RDS?

# Compare the two functions

# Assign the variable ram to the amount of RAM on this machine

# Assign the variable cpu to the cpu specs

Benchmark DataCamp's machine

# Run the benchmark

# Plot the results

Timings - growing a vector

Vectorized code: multiplication

Vectorized code: calculating a log-sum

# Rewrite in a single line. Store the result in log_sum

Data frames and matrices - column selection

# Profile the following code

# Plot data of interest

# Loess regression line

# Add fitted line to the plot

Change the data frame to a matrix

# Complete the matrix solution

# Use microbenchmark to time m() and d()

Calculating row sums

# Define the previous solution

# Define the new solution

# Compare the methods

Use && instead of &

# Define the previous solution

# Define the improved solution

How many cores does this machine have?

# Store the number of cores in the object no_of_cores

# Create a cluster via makeCluster

# Parallelize this code

# Stop the cluster

# Export the play() function to the cluster

# Re-write sapply as parSapply

# Stop the cluster

## Time serial version

## Time parallel version

You might also like