0% found this document useful (0 votes)

6 views4 pages

RStudio

The document contains R code for analyzing birth weight data, school performance data, and wage data. It includes calculations for descriptive statistics, correlations, and visualizations using ggplot2. The analysis covers topics such as the impact of smoking on birth weight, average pass rates in schools, and the relationship between education and wages.

Uploaded by

eshaan arora

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

6 views4 pages

RStudio

Uploaded by

eshaan arora

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

# Install the required packages only when they are missing, then attach them.
# The first install call had been split across lines (`install.` followed by
# `packages(...)`), which is not valid R; it is written as one call here.
for (pkg in c("wooldridge", "ggplot2")) {
  if (!requireNamespace(pkg, quietly = TRUE)) {
    install.packages(pkg)
  }
}
library(wooldridge)
library(ggplot2)

# Load the `bwght` data set used in Question 1.
data(bwght)

#QUESTION 1

# 1a. Calculate descriptive statistics for birth weight:

# Mean, ignoring missing values. `TRUE` is spelled out because `T` is an
# ordinary variable that can be reassigned.
mean_bwght <- mean(bwght$bwght, na.rm = TRUE)

# Median, ignoring missing values
median_bwght <- median(bwght$bwght, na.rm = TRUE)

# Mode: R has no built-in function for the statistical mode, so a custom
# function is used.
#
# Returns the most frequent value of `v`. When several values are tied, the
# one that occurs first in `v` is returned.
#
# Args:
#   v:     A vector of values.
#   na.rm: If TRUE, missing values are removed before counting. With the
#          default (FALSE) an NA is counted like any other value, so NA can
#          be returned as the mode.
#
# Returns:
#   A length-one vector holding the mode (NA when `v` is empty).
getmode <- function(v, na.rm = FALSE) {
  if (na.rm) {
    v <- v[!is.na(v)]
  }
  uniqv <- unique(v)
  # match() maps every element to the position of its unique value and
  # tabulate() counts how often each position occurs.
  uniqv[which.max(tabulate(match(v, uniqv)))]
}
# Most frequent birth weight, computed with the custom mode function
mode_bwght <- getmode(bwght[["bwght"]])

# Quartiles: the 25th, 50th and 75th percentiles, ignoring missing values
quartiles_bwght <- quantile(
  bwght[["bwght"]],
  probs = c(0.25, 0.5, 0.75),
  na.rm = TRUE
)

# Display results
mean_bwght
median_bwght
mode_bwght
quartiles_bwght

# 2a. Average number of cigarettes smoked per day:

# Mean of the `cigs` column, ignoring missing values
avg_smoke <- with(bwght, mean(cigs, na.rm = TRUE))

avg_smoke

# 2b. Association between smoking and birth weight:

# ggplot2 is only attached here. It is no longer re-installed at this point,
# because install.packages() in the middle of the script downloads the package
# again on every run.
library(ggplot2)

# Scatterplot of birth weight against cigarettes smoked. Points are coloured
# by cigarette count; the colour mapping is local to geom_point(), so
# geom_smooth() fits a single linear trend over all points.
ggplot(bwght, aes(x = cigs, y = bwght)) +
  geom_point(aes(color = factor(cigs))) +
  geom_smooth(method = "lm") +
  labs(
    title = "Birth Weight vs. Number of Cigarettes Smoked",
    x = "Number of Cigarettes Smoked",
    y = "Birth Weight"
  )

# 3a. Distribution of family income:

# Mean and standard deviation of `faminc`, ignoring missing values
mean_income <- mean(bwght[["faminc"]], na.rm = TRUE)
sd_income <- sd(bwght[["faminc"]], na.rm = TRUE)

mean_income
sd_income

# 3b. Correlation between birth weight and log of family income:

bwght$log_income <- log(bwght$faminc)

# Smokers: any positive number of cigarettes. The earlier filter `cigs > 1`
# left out mothers who smoke exactly one cigarette, so they were in neither
# group. which() also drops rows where `cigs` is missing instead of turning
# them into all-NA rows.
smoke_data <- bwght[which(bwght$cigs > 0), ]
cor_smoke <- cor(
  smoke_data$bwght,
  smoke_data$log_income,
  use = "complete.obs"
)

# Non-smokers: zero cigarettes
non_smoke_data <- bwght[which(bwght$cigs == 0), ]
cor_non_smoke <- cor(
  non_smoke_data$bwght,
  non_smoke_data$log_income,
  use = "complete.obs"
)

cor_smoke
cor_non_smoke

# 4a. Mean of fatheduc:

# Mean over the non-missing values
mean_fatheduc <- with(bwght, mean(fatheduc, na.rm = TRUE))

# Number of non-missing observations that the mean is based on
count_fatheduc <- with(bwght, sum(!is.na(fatheduc)))

mean_fatheduc
count_fatheduc

# 4b. Proportion of mothers who are high school graduates:

# The mean of the logical vector `motheduc >= 12` is the share of TRUE values;
# rows with missing `motheduc` are left out.
prop_highschool <- with(bwght, mean(motheduc >= 12, na.rm = TRUE))

prop_highschool

# 4c. Average birth weight by high school graduation status:

# Logical flag: TRUE when `motheduc` is at least 12, NA when it is missing.
# The full column name is used here; `bwght$mothed` only resolved to
# `motheduc` through partial matching of `$`.
bwght$highschool <- bwght$motheduc >= 12

# Mean birth weight within each value of the flag
avg_bwght_highschool <- aggregate(bwght ~ highschool, data = bwght, FUN = mean)

# Boxplot of birth weight for each value of the flag
ggplot(bwght, aes(x = factor(highschool), y = bwght)) +
  geom_boxplot() +
  labs(
    title = "Birth Weight by High School Graduation Status",
    x = "High School Graduate",
    y = "Birth Weight"
  )

avg_bwght_highschool

# QUESTION 2
data(meap01)

# 1
# Smallest and largest `read4` values (missing values ignored) and the gap
# between them
min_read4 <- with(meap01, min(read4, na.rm = TRUE))
max_read4 <- with(meap01, max(read4, na.rm = TRUE))
difference_read4 <- max_read4 - min_read4

min_read4
max_read4
difference_read4

# 2
# Number and percentage of schools with a perfect pass rate:

# Rows where `read4` is exactly 100; missing values are not counted
perfect_pass_rate_count <- sum(meap01[["read4"]] == 100, na.rm = TRUE)

# The percentage is taken over all rows of the data set
total_schools <- nrow(meap01)
percentage_perfect <- perfect_pass_rate_count / total_schools * 100

# Rows where `read4` is exactly 50
pass_rate_50_count <- sum(meap01[["read4"]] == 50, na.rm = TRUE)

perfect_pass_rate_count
percentage_perfect
pass_rate_50_count

# 3
# Compute the average pass rates and visualize:

# Means of `math4` and `read4`, ignoring missing values
avg_math4 <- with(meap01, mean(math4, na.rm = TRUE))
avg_read4 <- with(meap01, mean(read4, na.rm = TRUE))

avg_math4
avg_read4

library(ggplot2)

# Two-row table: one row per subject with its average pass rate
avg_rates <- data.frame(
  Subject = c("Math", "Reading"),
  Average_Pass_Rate = c(avg_math4, avg_read4)
)

# One bar per subject; bar height is the value in Average_Pass_Rate
ggplot(avg_rates, aes(x = Subject, y = Average_Pass_Rate, fill = Subject)) +
  geom_col() +
  ggtitle("Average Pass Rates for Math and Reading") +
  xlab("Subject") +
  ylab("Average Pass Rate")

# 4 a and b
# Pearson Correlation Coefficient and Scatterplot:

# cor() uses the Pearson method by default; only rows where both rates are
# present are used
correlation <- with(meap01, cor(math4, read4, use = "complete.obs"))

correlation

# Reading against math pass rate, points shaded by `enroll`, with a fitted
# straight line drawn without a confidence band
ggplot(meap01, aes(x = math4, y = read4)) +
  geom_point(aes(colour = enroll)) +
  geom_smooth(method = "lm", se = FALSE) +
  ggtitle("Scatterplot of Math vs. Reading Pass Rates") +
  xlab("Math Pass Rate") +
  ylab("Reading Pass Rate") +
  scale_colour_distiller(palette = "Spectral")

# 5
# Create categories for school size and calculate average pass rates:

# Bin `enroll` into three size classes. The first label is written on one
# line; it had been broken across lines, which put newline characters inside
# the "Small" label.
# NOTE(review): cut() closes intervals on the right by default, so an
# enrolment of exactly 300 is labelled "Small" and exactly 600 "Medium" --
# confirm this is the intended boundary handling.
meap01$size_cat <- cut(
  meap01$enroll,
  breaks = c(-Inf, 300, 600, Inf),
  labels = c("Small (<300)", "Medium (300-600)", "Large (>600)")
)

# Mean math and reading pass rate per size class; `na.rm = TRUE` is passed
# through to mean()
avg_pass_rates_by_size <- aggregate(
  cbind(math4, read4) ~ size_cat,
  data = meap01,
  FUN = mean,
  na.rm = TRUE
)

# Reshape to one row per (size class, subject) so that both subjects are
# drawn by a single layer. With two separate bar layers, position = "dodge"
# has nothing to dodge against within a layer, and the Reading bars were drawn
# on top of the Math bars.
pass_rates_long <- rbind(
  data.frame(
    size_cat = avg_pass_rates_by_size$size_cat,
    subject = "Math",
    pass_rate = avg_pass_rates_by_size$math4
  ),
  data.frame(
    size_cat = avg_pass_rates_by_size$size_cat,
    subject = "Reading",
    pass_rate = avg_pass_rates_by_size$read4
  )
)

# Side-by-side bars: Math and Reading next to each other within each size class
ggplot(pass_rates_long, aes(x = size_cat, y = pass_rate, fill = subject)) +
  geom_col(position = "dodge") +
  labs(
    title = "Average Pass Rates by School Size",
    x = "School Size Category",
    y = "Average Pass Rate"
  ) +
  scale_fill_manual(
    name = "Subject",
    values = c("Math" = "blue", "Reading" = "red")
  )

# QUESTION 3

data(wage1)

# 1
# Calculate the average educational level, lowest, and highest years of education:

# Mean, minimum and maximum of `educ`, each ignoring missing values
avg_education <- with(wage1, mean(educ, na.rm = TRUE))
min_education <- with(wage1, min(educ, na.rm = TRUE))
max_education <- with(wage1, max(educ, na.rm = TRUE))

avg_education
min_education
max_education

# 2
# Determine the average per-hour wage and interpret:

# Mean of `wage`, ignoring missing values
avg_wage <- with(wage1, mean(wage, na.rm = TRUE))

avg_wage

# 3
# Calculate the proportion of women and men in the sample:

# Mean of `female`, ignoring missing values
# NOTE(review): this is the share of women only if `female` is coded 0/1 --
# confirm against the data set documentation.
prop_women <- with(wage1, mean(female, na.rm = TRUE))

# Men are the complement of women
prop_men <- 1 - prop_women

prop_women
prop_men

# 4
# Calculate the probability that a randomly chosen woman is married:

# Keep only the rows with female == 1; which() leaves out rows where the
# comparison is NA
women_data <- wage1[which(wage1$female == 1), ]

# Mean of `married` among those rows, ignoring missing values
prop_married_women <- mean(women_data[["married"]], na.rm = TRUE)

prop_married_women

# 5a. Association between Hourly Wage and Education:

library(ggplot2)

# Wage against years of education with a fitted straight line and its default
# confidence band
ggplot(data = wage1, mapping = aes(x = educ, y = wage)) +
  geom_point() +
  geom_smooth(method = "lm") +
  ggtitle("Hourly Wage vs. Education") +
  xlab("Years of Education") +
  ylab("Hourly Wage")

# 5b. Hourly Wage and Education by Marital Status:

# Same scatterplot, coloured by `married`; one fitted line per colour group,
# drawn without confidence bands.
# NOTE(review): the legend labels assume `married` is coded 0 = unmarried,
# 1 = married -- confirm against the data set documentation.
ggplot(
  data = wage1,
  mapping = aes(x = educ, y = wage, colour = factor(married))
) +
  geom_point() +
  geom_smooth(method = "lm", se = FALSE) +
  ggtitle("Hourly Wage vs. Education by Marital Status") +
  xlab("Years of Education") +
  ylab("Hourly Wage") +
  labs(colour = "Marital Status") +
  scale_colour_manual(
    values = c("blue", "red"),
    labels = c("Unmarried", "Married")
  )

# 5c. Hourly Wage and Education by Gender and Marital Status:

# Every `+` sits at the end of a line. A `+` at the start of a new line, after
# the complete ggplot(...) call, begins a separate expression, so the layers
# are never added to the plot and the stray `+` raises an error.
# NOTE(review): the legend labels assume `married` is coded 0 = unmarried,
# 1 = married and `female` is coded 0 = male, 1 = female -- confirm against
# the data set documentation.
ggplot(
  wage1,
  aes(x = educ, y = wage, color = factor(married), shape = factor(female))
) +
  geom_point() +
  geom_smooth(method = "lm", se = FALSE) +
  labs(
    title = "Hourly Wage vs. Education by Gender and Marital Status",
    x = "Years of Education",
    y = "Hourly Wage",
    color = "Marital Status",
    shape = "Gender"
  ) +
  scale_color_manual(
    values = c("blue", "red"),
    labels = c("Unmarried", "Married")
  ) +
  scale_shape_manual(values = c(16, 17), labels = c("Male", "Female"))

Tektronix 760 Manual
100% (3)
Tektronix 760 Manual
120 pages
SOP Overhead Crane-Rev.1
No ratings yet
SOP Overhead Crane-Rev.1
5 pages
Lab 2
No ratings yet
Lab 2
22 pages
Econ 2b03 Assignment 1
No ratings yet
Econ 2b03 Assignment 1
8 pages
BDA MSC It
No ratings yet
BDA MSC It
35 pages
Workshop Activity: X Seq y Length
No ratings yet
Workshop Activity: X Seq y Length
3 pages
Mock Exam - Appendix
No ratings yet
Mock Exam - Appendix
15 pages
R Code
No ratings yet
R Code
9 pages
IntroR 2
No ratings yet
IntroR 2
18 pages
Problem Set 1: Introduction To R - Solutions With R Output: 1 Install Packages
No ratings yet
Problem Set 1: Introduction To R - Solutions With R Output: 1 Install Packages
24 pages
Merge
No ratings yet
Merge
28 pages
BAN5
No ratings yet
BAN5
2 pages
Advanced Statistical Methods Using R
No ratings yet
Advanced Statistical Methods Using R
32 pages
Preprocessing - Preprocessing Your Data With R
No ratings yet
Preprocessing - Preprocessing Your Data With R
23 pages
Multicollinearity and Oaxaca - Tutorial
No ratings yet
Multicollinearity and Oaxaca - Tutorial
35 pages
Chapter 2 R Ggplot2 Examples
No ratings yet
Chapter 2 R Ggplot2 Examples
22 pages
CS1B April 2024
No ratings yet
CS1B April 2024
9 pages
Commands For Data Analysis Using R
No ratings yet
Commands For Data Analysis Using R
11 pages
Ggplot2 Exercise
No ratings yet
Ggplot2 Exercise
6 pages
R
No ratings yet
R
6 pages
Assignment-1 80501
No ratings yet
Assignment-1 80501
6 pages
Fixed Versus Random Effects
No ratings yet
Fixed Versus Random Effects
82 pages
R File Code
No ratings yet
R File Code
16 pages
R Training AM
No ratings yet
R Training AM
6 pages
R Practice
No ratings yet
R Practice
38 pages
R Note
No ratings yet
R Note
56 pages
Copy Entire Document Content in R Studio: R Script Compiled by Mr. Anup Sharma (Strictly To Be Used As Class Notes)
No ratings yet
Copy Entire Document Content in R Studio: R Script Compiled by Mr. Anup Sharma (Strictly To Be Used As Class Notes)
15 pages
DSA Lab
No ratings yet
DSA Lab
29 pages
Problem Set
No ratings yet
Problem Set
8 pages
Copy Entire Document Content in R Studio
No ratings yet
Copy Entire Document Content in R Studio
17 pages
R Practical
No ratings yet
R Practical
9 pages
Modelling With R
No ratings yet
Modelling With R
3 pages
Lab File AD PDF
No ratings yet
Lab File AD PDF
25 pages
DALab Part-B BCU&BU
No ratings yet
DALab Part-B BCU&BU
12 pages
R Programming-1
No ratings yet
R Programming-1
6 pages
Exercícios Da 1 Aula
No ratings yet
Exercícios Da 1 Aula
6 pages
Lecture 1
No ratings yet
Lecture 1
167 pages
2 R - Zajecia - 4 - Eng
No ratings yet
2 R - Zajecia - 4 - Eng
7 pages
Statistics Assignment
No ratings yet
Statistics Assignment
4 pages
R Multiple Regression Exercise 2019
No ratings yet
R Multiple Regression Exercise 2019
6 pages
"Cps - TXT" "Education" "South" "SEX" "Experience" "Union" "WAGE" "AGE" "RACE" "Occupat Ion" "Sector" "MARR"
No ratings yet
"Cps - TXT" "Education" "South" "SEX" "Experience" "Union" "WAGE" "AGE" "RACE" "Occupat Ion" "Sector" "MARR"
9 pages
Sta108hw4 1
No ratings yet
Sta108hw4 1
5 pages
Lab 5 EA
No ratings yet
Lab 5 EA
4 pages
Combined 8 15
No ratings yet
Combined 8 15
8 pages
BM-1, Applied Statistics, Lesson 2: Comparing Two Groups (And One Group)
No ratings yet
BM-1, Applied Statistics, Lesson 2: Comparing Two Groups (And One Group)
39 pages
DA Manual - Part B
No ratings yet
DA Manual - Part B
13 pages
Supervised Learning by Fadhlurrohman Henriwan
No ratings yet
Supervised Learning by Fadhlurrohman Henriwan
31 pages
Modeling and Visulizing Data Using R: A Practical Introduction
No ratings yet
Modeling and Visulizing Data Using R: A Practical Introduction
106 pages
R Working Materials Prep
No ratings yet
R Working Materials Prep
43 pages
Plotting With Ggplot: Install - Packages ("Ggplot2") Library (Ggplot2)
No ratings yet
Plotting With Ggplot: Install - Packages ("Ggplot2") Library (Ggplot2)
3 pages
R Studio Notes
No ratings yet
R Studio Notes
6 pages
R For Health Data Science 1st Edition Complete Volume Download
No ratings yet
R For Health Data Science 1st Edition Complete Volume Download
15 pages
Experiment 2
No ratings yet
Experiment 2
7 pages
R Practicals
No ratings yet
R Practicals
32 pages
R Stats Cheatsheet
No ratings yet
R Stats Cheatsheet
1 page
S24 Stats10 Lab1-1
No ratings yet
S24 Stats10 Lab1-1
8 pages
Lab Manual - DSR
No ratings yet
Lab Manual - DSR
32 pages
3 Ggplot PDF
No ratings yet
3 Ggplot PDF
19 pages
Regression2 Implementation
No ratings yet
Regression2 Implementation
29 pages
Notebook 2 - Linear Regression
No ratings yet
Notebook 2 - Linear Regression
11 pages
Pre-Calculus Essentials
From Everand
Pre-Calculus Essentials
Ernest Woodward
No ratings yet
No Ph.D. Game Design With Three.js
From Everand
No Ph.D. Game Design With Three.js
Nikiforos Kontopoulos
No ratings yet
Planner
No ratings yet
Planner
2 pages
Science Fair
No ratings yet
Science Fair
8 pages
Cther Crowther Marketing Event Outcomes Tactical Strategic
No ratings yet
Cther Crowther Marketing Event Outcomes Tactical Strategic
15 pages
Product Specifications
No ratings yet
Product Specifications
2 pages
Intac Reviewer 2
No ratings yet
Intac Reviewer 2
10 pages
E3a1 Guidelines AnnexJ en
No ratings yet
E3a1 Guidelines AnnexJ en
3 pages
SANS Malware Analysis & Reverse Engineering Cheat Sheet
No ratings yet
SANS Malware Analysis & Reverse Engineering Cheat Sheet
1 page
Educational Technology and Education Conferences (January To June 2012) Por Clayton R Wright
No ratings yet
Educational Technology and Education Conferences (January To June 2012) Por Clayton R Wright
56 pages
ASSIGNMENT-Construction Personnel Management
No ratings yet
ASSIGNMENT-Construction Personnel Management
13 pages
Roman Granite Catalogue Complete
No ratings yet
Roman Granite Catalogue Complete
260 pages
IEEE STD C37.42-2016 TRANG 1.24
No ratings yet
IEEE STD C37.42-2016 TRANG 1.24
2 pages
Prefabricated Housing in Japan
No ratings yet
Prefabricated Housing in Japan
25 pages
Agenda & Report 2024-2
No ratings yet
Agenda & Report 2024-2
67 pages
Combined Slides Policy Quarterly Member Roundtable 06.2024
No ratings yet
Combined Slides Policy Quarterly Member Roundtable 06.2024
17 pages
Ansys CFX Tutorials - Release 13 PDF
No ratings yet
Ansys CFX Tutorials - Release 13 PDF
636 pages
A Synopsis Report ON Credit Risk Management AT Icici Bank LTD
No ratings yet
A Synopsis Report ON Credit Risk Management AT Icici Bank LTD
19 pages
CH 2 PDF
No ratings yet
CH 2 PDF
85 pages
01 Architecture
No ratings yet
01 Architecture
22 pages
Why Use MPC Based Contact For - Bonded - Connections
No ratings yet
Why Use MPC Based Contact For - Bonded - Connections
5 pages
11th Computer Science EM Public Exam 2023 Important 5 Mark Questions English Medium PDF Download
No ratings yet
11th Computer Science EM Public Exam 2023 Important 5 Mark Questions English Medium PDF Download
1 page
Child Labor
No ratings yet
Child Labor
15 pages
Reviewer: Industrial Organizational Psychology
100% (3)
Reviewer: Industrial Organizational Psychology
35 pages
2.1 Definition of Small Business
No ratings yet
2.1 Definition of Small Business
45 pages
Recent Progress in Alkaline Water Electrolysis For Hydrogen Production and Applications.
No ratings yet
Recent Progress in Alkaline Water Electrolysis For Hydrogen Production and Applications.
20 pages
Tally and Accounting Course Notes
No ratings yet
Tally and Accounting Course Notes
35 pages
Psychrometry Chart
No ratings yet
Psychrometry Chart
7 pages
OD226071921943274000
No ratings yet
OD226071921943274000
1 page
CG 5BrochureRev1
No ratings yet
CG 5BrochureRev1
2 pages