0% found this document useful (0 votes)

13 views5 pages

Assignment-6

Uploaded by

datakushagra

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

13 views5 pages

Assignment-6

Uploaded by

datakushagra

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 5

Assignment - 6

# Load necessary libraries

# Install dplyr only when it is not already available, so re-running the
# script does not trigger a fresh download every time, then attach it.
if (!requireNamespace("dplyr", quietly = TRUE)) {
  install.packages("dplyr")
}
library(dplyr)

#Q1)
# Create the dataset
#
# Builds `data`, a 20-row synthetic data frame with one row per country:
#   Country   - the 20 country names in a random order
#   Continent - continent looked up from Country
#   Year      - random year drawn from 2000..2020 (with replacement)
#   LifeExp   - uniform draw between 50 and 85
#   Pop       - random integer drawn from 1e6..1e8 (with replacement)
#   gdpPerc   - uniform draw between 1000 and 50000
set.seed(123)

# Country -> continent lookup. The countries are shuffled below, so the
# continent has to be derived from the country name; a fixed positional
# vector would attach continents to the wrong countries.
# NOTE(review): Turkey is transcontinental and is filed under Asia here;
# "Australia" is kept as the continent label for Australia.
continent_of <- c(
  "USA" = "North America",
  "Germany" = "Europe",
  "India" = "Asia",
  "France" = "Europe",
  "Japan" = "Asia",
  "China" = "Asia",
  "Brazil" = "South America",
  "UK" = "Europe",
  "Canada" = "North America",
  "Russia" = "Europe",
  "Italy" = "Europe",
  "South Africa" = "Africa",
  "Australia" = "Australia",
  "Spain" = "Europe",
  "Mexico" = "North America",
  "Nigeria" = "Africa",
  "Argentina" = "South America",
  "Egypt" = "Africa",
  "Turkey" = "Asia",
  "Sweden" = "Europe"
)

# Draw the country order first so the random-number stream is consumed in
# the same sequence as before (Country, Year, LifeExp, Pop, gdpPerc).
countries <- sample(names(continent_of), 20, replace = FALSE)

data <- data.frame(
  Country = countries,
  Continent = unname(continent_of[countries]),
  Year = sample(2000:2020, 20, replace = TRUE),
  LifeExp = runif(20, 50, 85),
  Pop = sample(1e6:1e8, 20, replace = TRUE),
  gdpPerc = runif(20, 1000, 50000)
)
print(data)
# 1. Unique countries per continent
# One output row per continent, counting the distinct country names in it.
data %>%
  group_by(Continent) %>%
  summarise(UniqueCountries = length(unique(Country)))

# 2. European nation with the lowest GDP per capita in a given year
# Keep only the European rows, then take the single row with the smallest
# gdpPerc value.
data %>%
  filter(Continent == "Europe") %>%
  slice_min(gdpPerc, n = 1, with_ties = FALSE)

# 3. Average life expectancy across each continent in a given year
# One output row per (Continent, Year) pair. `.groups = "drop"` returns an
# ungrouped result, so no leftover grouping leaks into later steps and dplyr
# does not emit its regrouping message.
data %>%
  group_by(Continent, Year) %>%
  summarise(
    AverageLifeExp = mean(LifeExp, na.rm = TRUE),
    .groups = "drop"
  )

# 4. Top 5 countries with the highest total GDP over all years
# Total GDP of a row is population times GDP per capita; sum it per country,
# sort from largest to smallest and keep the first five rows.
data %>%
  group_by(Country) %>%
  summarise(TotalGDP = sum(Pop * gdpPerc)) %>%
  arrange(desc(TotalGDP)) %>%
  slice_head(n = 5)

# 5. Countries and years with life expectancy >= 80
# Narrow to the three columns of interest, then keep the qualifying rows.
data %>%
  select(Country, Year, LifeExp) %>%
  filter(LifeExp >= 80)

# 6. Top 10 countries with strongest correlation between life expectancy and GDP per capita
# A correlation is only defined for countries with at least two observations,
# so smaller groups are dropped before calling cor(). Any remaining NA
# correlations (e.g. a constant column) are removed as well, so that NA rows
# are never reported as "strongest". The result is ranked by absolute
# correlation and may have fewer than 10 rows (or none).
data %>%
  group_by(Country) %>%
  filter(n() >= 2) %>%
  summarise(Correlation = cor(LifeExp, gdpPerc)) %>%
  filter(!is.na(Correlation)) %>%
  arrange(desc(abs(Correlation))) %>%
  slice_head(n = 10)

# 7. Combinations of continent (besides Asia) and year with the highest average population
# The summary must be ungrouped before picking the top row: summarise() on
# two grouping columns leaves the result grouped by Continent, and slicing a
# grouped table returns the first row of every continent rather than the
# single overall maximum.
data %>%
  filter(Continent != "Asia") %>%
  group_by(Continent, Year) %>%
  summarise(AveragePop = mean(Pop, na.rm = TRUE), .groups = "drop") %>%
  arrange(desc(AveragePop)) %>%
  slice_head(n = 1)

# 8. Three countries with the most consistent population estimates
# Consistency is measured as the standard deviation of Pop per country
# (smaller = more consistent). sd() of a single observation is NA, so those
# countries are removed instead of being listed as if they were consistent.
# The result may therefore have fewer than three rows (or none).
data %>%
  group_by(Country) %>%
  summarise(PopSD = sd(Pop)) %>%
  filter(!is.na(PopSD)) %>%
  arrange(PopSD) %>%
  slice_head(n = 3)

# 9. Population decreased, and life expectancy increased from the previous year
# Within each country, ordered by year, compare every row with the row before
# it; the first row of a country has no predecessor, so its changes are NA and
# it is dropped by the filter.
data %>%
  arrange(Country, Year) %>%
  group_by(Country) %>%
  mutate(
    PopChange = Pop - lag(Pop),
    LifeExpChange = LifeExp - lag(LifeExp)
  ) %>%
  filter(PopChange < 0, LifeExpChange > 0)

#Q2)
# Create the dataset and save it as a CSV file
#
# Ten synthetic medicine records: an id, a name, the manufacturing company,
# the manufacturing year, an expiry date, the quantity in stock and the sales.
med_data <- data.frame(
  MedID = 1:10,
  Med_Name = paste0("Med", 1:10),
  Company = c("A", "B", "C", "A", "B", "C", "A", "D", "E", "F"),
  Manf_year = sample(2000:2020, 10, replace = TRUE),
  # Day counts since 1970-01-01, converted to Date values.
  Exp_date = as.Date(
    sample(18250:18500, 10, replace = TRUE),
    origin = "1970-01-01"
  ),
  Quantity_in_stock = sample(50:500, 10),
  Sales = sample(1000:5000, 10)
)
med_data

# Write the file only when it does not exist yet: a fresh run can then read
# it back below, while an existing DataSet.csv is left untouched.
if (!file.exists("DataSet.csv")) {
  write.csv(med_data, "DataSet.csv", row.names = FALSE)
}

# Read the data file

med_data <- read.csv("DataSet.csv")
# read.csv() returns the expiry dates as text; restore the Date class so
# later date arithmetic and comparisons work on real dates.
med_data$Exp_date <- as.Date(med_data$Exp_date)

# 1. Show the first 4 records
# Leading four rows of the medicine table.
head(med_data, n = 4)

# 2. Show the last 4 records
# Trailing four rows of the medicine table.
tail(med_data, n = 4)

# 3. Correlation between Quantity_in_stock and Exp_date
# Exp_date comes back from read.csv() as text, and as.numeric() on date text
# yields NA. Going through as.Date() first turns each date into its day count
# since 1970-01-01 (and is a no-op when the column is already a Date).
cor(
  med_data$Quantity_in_stock,
  as.numeric(as.Date(med_data$Exp_date))
)

# 4. Bar graph for Sales with year of manufacturing
# Install ggplot2 only when it is missing, so re-running the script does not
# download it again, then attach it.
if (!requireNamespace("ggplot2", quietly = TRUE)) {
  install.packages("ggplot2")
}
library(ggplot2)

# One bar per manufacturing year (treated as a category); bar height is the
# Sales value, stacked when several medicines share a year. geom_col() is the
# direct form of geom_bar(stat = "identity").
ggplot(med_data, aes(x = factor(Manf_year), y = Sales)) +
  geom_col(fill = "blue") +
  labs(
    x = "Manufacturing Year",
    y = "Sales",
    title = "Sales by Manufacturing Year"
  )

# 5. Companies with more than one type of medicine
# Count the rows per company and keep the companies that appear more than once.
med_data %>%
  group_by(Company) %>%
  tally(name = "NumMeds") %>%
  filter(NumMeds > 1)

# 6. Types of medicines available
# Distinct medicine names, in order of first appearance.
unique(med_data[["Med_Name"]])

# 7. Medicines expiring
# Rows whose expiry date lies before today's date. The date conversion is
# spelled out here instead of being left to the comparison operator.
med_data %>%
  filter(as.Date(Exp_date) < Sys.Date())

# 8. Average stock in the store
# Arithmetic mean of the quantity-in-stock column.
mean(med_data[["Quantity_in_stock"]])

# 9. Regression line between Manufacturing year and Sales
# Scatter plot of Sales against manufacturing year with a fitted straight
# line (linear model, no confidence band). The formula is stated explicitly
# so ggplot2 does not have to announce the default it picked, and the title
# is kept on one line so it contains no stray line break.
ggplot(med_data, aes(x = Manf_year, y = Sales)) +
  geom_point() +
  geom_smooth(method = "lm", formula = y ~ x, se = FALSE, color = "red") +
  labs(
    x = "Manufacturing Year",
    y = "Sales",
    title = "Regression of Sales vs Manufacturing Year"
  )

Notes Viz
100% (1)
Notes Viz
79 pages
Question No1
No ratings yet
Question No1
6 pages
20mia1032 Lab 5
No ratings yet
20mia1032 Lab 5
7 pages
Ex3
No ratings yet
Ex3
4 pages
Lab 3 (Tutorial 1)
No ratings yet
Lab 3 (Tutorial 1)
20 pages
Plotting Technique Purpose
No ratings yet
Plotting Technique Purpose
4 pages
Data Mining Assignment 1: Group 3: Ankita (BLP008), Arnab (BLP013), Kaustav (BLP025), Pubali (BLP040)
No ratings yet
Data Mining Assignment 1: Group 3: Ankita (BLP008), Arnab (BLP013), Kaustav (BLP025), Pubali (BLP040)
5 pages
R
No ratings yet
R
6 pages
R_training_AM
No ratings yet
R_training_AM
6 pages
R Note
No ratings yet
R Note
56 pages
R code
No ratings yet
R code
9 pages
Hierarchical Clustering and Experiment With Cutting The Dendrogram
No ratings yet
Hierarchical Clustering and Experiment With Cutting The Dendrogram
5 pages
Data Visualization
No ratings yet
Data Visualization
46 pages
WEEK 3 Activity - Assignment 1
No ratings yet
WEEK 3 Activity - Assignment 1
5 pages
R_record-1
No ratings yet
R_record-1
57 pages
Sahanashree Ex-2 ML (2)
No ratings yet
Sahanashree Ex-2 ML (2)
9 pages
R Course
No ratings yet
R Course
7 pages
(Practical) Programming With R
No ratings yet
(Practical) Programming With R
5 pages
EXAM1 - Muhibbul Arman Mannan: List Ls
No ratings yet
EXAM1 - Muhibbul Arman Mannan: List Ls
13 pages
Case Study[1]
No ratings yet
Case Study[1]
5 pages
Rstudio Study Notes For PA 20181126
No ratings yet
Rstudio Study Notes For PA 20181126
6 pages
Criando Data Frame
No ratings yet
Criando Data Frame
6 pages
Midterm_Project_Group_6
No ratings yet
Midterm_Project_Group_6
41 pages
IntroR 2
No ratings yet
IntroR 2
18 pages
03.python.08.plot.examples
No ratings yet
03.python.08.plot.examples
5 pages
Group 1 Project Report DA
No ratings yet
Group 1 Project Report DA
65 pages
Exploratory Analysis
No ratings yet
Exploratory Analysis
4 pages
ETW2001 A2 Instruction
No ratings yet
ETW2001 A2 Instruction
5 pages
Lab Manual _DSR
No ratings yet
Lab Manual _DSR
32 pages
AMDA Practical - A048
No ratings yet
AMDA Practical - A048
35 pages
Commands for Data Analysis using R
No ratings yet
Commands for Data Analysis using R
11 pages
Comp Lab 2 GunExample 2425
No ratings yet
Comp Lab 2 GunExample 2425
15 pages
HW 4
No ratings yet
HW 4
12 pages
Correlation
No ratings yet
Correlation
5 pages
Visualizing Big Data With Trelliscope
No ratings yet
Visualizing Big Data With Trelliscope
7 pages
Note 2
No ratings yet
Note 2
27 pages
R Poisson
No ratings yet
R Poisson
11 pages
Code (Misbha & Nishi)
No ratings yet
Code (Misbha & Nishi)
10 pages
BDA MSC It
No ratings yet
BDA MSC It
35 pages
Assignment 1
No ratings yet
Assignment 1
12 pages
Monthly Expenditure
No ratings yet
Monthly Expenditure
11 pages
Practical4 Solution-1
No ratings yet
Practical4 Solution-1
9 pages
Creating plotly maps in R
No ratings yet
Creating plotly maps in R
2 pages
Session 4 (Practice)
No ratings yet
Session 4 (Practice)
1 page
Experiment No 8
No ratings yet
Experiment No 8
11 pages
Assignment lab 2
No ratings yet
Assignment lab 2
4 pages
model_lab[1]
No ratings yet
model_lab[1]
6 pages
Digital Assignment-6: Read The Data
No ratings yet
Digital Assignment-6: Read The Data
30 pages
R Code
No ratings yet
R Code
13 pages
Intro To Analyzing Cross-Sectional Time-Series Data in R (For Students of IR & Comparative Politics)
No ratings yet
Intro To Analyzing Cross-Sectional Time-Series Data in R (For Students of IR & Comparative Politics)
18 pages
Assignment-1 80501
No ratings yet
Assignment-1 80501
6 pages
Regression and Eda
No ratings yet
Regression and Eda
47 pages
Clustering 2
No ratings yet
Clustering 2
11 pages
DVT (Lab) - R Language Manual
No ratings yet
DVT (Lab) - R Language Manual
20 pages
5_SingleVariableVisualization_2
No ratings yet
5_SingleVariableVisualization_2
20 pages
The Mighty Everest Expedition Analysis
No ratings yet
The Mighty Everest Expedition Analysis
12 pages
Cluster R
No ratings yet
Cluster R
1 page
Can We Really Live Longer - A Machine Learning Study - by Nicolasdealba - Medium
No ratings yet
Can We Really Live Longer - A Machine Learning Study - by Nicolasdealba - Medium
34 pages
Final Group Project
No ratings yet
Final Group Project
26 pages
Apache Cassandra Developer Associate - Exam Practice Tests
From Everand
Apache Cassandra Developer Associate - Exam Practice Tests
Cristian Scutaru
No ratings yet
DOP-107EG: Instruction Sheet
No ratings yet
DOP-107EG: Instruction Sheet
8 pages
Datasheet FBLT054049 en US
No ratings yet
Datasheet FBLT054049 en US
1 page
FinancialLedger IQ3014
No ratings yet
FinancialLedger IQ3014
1 page
ALARM & WARNING HAGLUNDS in HMI
No ratings yet
ALARM & WARNING HAGLUNDS in HMI
2 pages
BTech06 Syl
No ratings yet
BTech06 Syl
37 pages
Global Report - What Worries The World June 23-WEB
No ratings yet
Global Report - What Worries The World June 23-WEB
29 pages
A Blessed Happy Day Everyone! Dr. Eleanor B. Remo: Research
No ratings yet
A Blessed Happy Day Everyone! Dr. Eleanor B. Remo: Research
109 pages
Stand Battles in Anime - Google Search
No ratings yet
Stand Battles in Anime - Google Search
1 page
Application Note: Renesas R-Car H2 Platform For Automotive Infotainment
No ratings yet
Application Note: Renesas R-Car H2 Platform For Automotive Infotainment
15 pages
Ppis12-How To Reduce Hand Knife Injuries
No ratings yet
Ppis12-How To Reduce Hand Knife Injuries
4 pages
ML Unit 3
No ratings yet
ML Unit 3
2 pages
Motors PDF
No ratings yet
Motors PDF
15 pages
Tire Inspection Guide
No ratings yet
Tire Inspection Guide
38 pages
PAPER 1 Reading Passages
No ratings yet
PAPER 1 Reading Passages
3 pages
Refresher Courses
No ratings yet
Refresher Courses
4 pages
Eas.81.2.2006 Humedad Leche Polvo
No ratings yet
Eas.81.2.2006 Humedad Leche Polvo
17 pages
Leadership and The Decision
No ratings yet
Leadership and The Decision
13 pages
Troubleshooting Guide
No ratings yet
Troubleshooting Guide
2 pages
Service Manual: Model No. ESA41 2K
No ratings yet
Service Manual: Model No. ESA41 2K
24 pages
Asia Banking Corp v. Javier
No ratings yet
Asia Banking Corp v. Javier
2 pages
K-W-L Chart: (Financial Accounts) Bba - Semester 1
No ratings yet
K-W-L Chart: (Financial Accounts) Bba - Semester 1
9 pages
Anhydrous Ammonia System Piping Requirements
No ratings yet
Anhydrous Ammonia System Piping Requirements
4 pages
Express Course
No ratings yet
Express Course
135 pages
Group 11 Slides
No ratings yet
Group 11 Slides
35 pages
Germany - MBBS - Proposal
No ratings yet
Germany - MBBS - Proposal
4 pages
final ael report
No ratings yet
final ael report
7 pages
Certificate of Operation Unfired Pressure Vessels
No ratings yet
Certificate of Operation Unfired Pressure Vessels
1 page
Free Trade Area of Kenyir Lake
0% (2)
Free Trade Area of Kenyir Lake
79 pages
Bioremediation Techniques For Polluted Environment - Concept, Advantages, Limitations, and Prospects IntechOpen
No ratings yet
Bioremediation Techniques For Polluted Environment - Concept, Advantages, Limitations, and Prospects IntechOpen
33 pages
Nutella Case Study (English)
No ratings yet
Nutella Case Study (English)
1 page

Assignment-6

Uploaded by

Assignment-6

Uploaded by

Assignment - 6

# Load necessary libraries

# 3. Average life expectancy across each continent in a given year

# 5. Countries and years with life expectancy >= 80

# 8. Three countries with the most consistent population estimates

# Read the data file

# 1. Show the first 4 records

# 2. Show the last 4 records

# 3. Correlation between Quantity_in_stock and Exp_date

# 4. Bar graph for Sales with year of manufacturing

# 5. Companies with more than one type of medicine

# 6. Types of medicines available

# 8. Average stock in the store

# 9. Regression line between Manufacturing year and Sales

You might also like