0% found this document useful (0 votes)

22 views4 pages

RStudio

The document contains R code for analyzing birth weight data, school performance data, and wage data. It includes calculations for descriptive statistics, correlations, and visualizations using ggplot2. The analysis covers topics such as the impact of smoking on birth weight, average pass rates in schools, and the relationship between education and wages.

Uploaded by

eshaan arora

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

22 views4 pages

RStudio

Uploaded by

eshaan arora

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 4

# Install the required packages only when they are missing, so that
# re-running the script does not download them again every time.
# (The first install.packages() call used to be split across two lines
# as `install.` / `packages(...)`, which R cannot evaluate.)
if (!requireNamespace("wooldridge", quietly = TRUE)) {
  install.packages("wooldridge")
}
if (!requireNamespace("ggplot2", quietly = TRUE)) {
  install.packages("ggplot2")
}

library(wooldridge)
library(ggplot2)

# Load the `bwght` data set used throughout Question 1.
data(bwght)

#QUESTION 1

# 1a. Descriptive statistics for birth weight.

# Mean, ignoring missing values. `TRUE` is spelled out because `T` is an
# ordinary variable that can be reassigned, which would silently change
# the meaning of `na.rm`.
mean_bwght <- mean(bwght$bwght, na.rm = TRUE)

# Median, ignoring missing values.
median_bwght <- median(bwght$bwght, na.rm = TRUE)

# Most frequent value of a vector (base R has no statistical-mode helper).
# When several values tie for the highest count, the one that appears
# first in `v` is returned.
getmode <- function(v) {
  distinct_values <- unique(v)
  # Position of every element of `v` within the distinct values.
  positions <- match(v, distinct_values)
  occurrences <- tabulate(positions)
  distinct_values[which.max(occurrences)]
}
mode_bwght <- getmode(bwght[["bwght"]])

# Quartiles: the 25th, 50th and 75th percentiles, missing values dropped.
quartiles_bwght <- quantile(
  bwght[["bwght"]],
  probs = c(0.25, 0.5, 0.75),
  na.rm = TRUE
)

# Show the four summaries computed for birth weight.
mean_bwght
median_bwght
mode_bwght
quartiles_bwght

# 2a. Mean number of cigarettes smoked per day (missing values dropped).
avg_smoke <- mean(bwght[["cigs"]], na.rm = TRUE)

avg_smoke

# 2b. Association between smoking and birth weight.

# ggplot2 is attached here so the section can be run on its own. It is no
# longer re-installed at this point: calling install.packages() in the
# middle of the analysis downloaded the package again on every run.
library(ggplot2)

# Scatterplot of birth weight against cigarettes smoked. Points are
# coloured by cigarette count and a fitted linear trend line is overlaid.
ggplot(bwght, aes(x = cigs, y = bwght)) +
  geom_point(aes(color = factor(cigs))) +
  geom_smooth(method = "lm") +
  labs(
    title = "Birth Weight vs. Number of Cigarettes Smoked",
    x = "Number of Cigarettes Smoked",
    y = "Birth Weight"
  )

# 3a. Distribution of family income: centre and spread.

# Both statistics skip missing values.
sd_income <- sd(bwght[["faminc"]], na.rm = TRUE)
mean_income <- mean(bwght[["faminc"]], na.rm = TRUE)

mean_income
sd_income

# 3b. Correlation between birth weight and log of family income,
# computed separately for smokers and non-smokers.

bwght$log_income <- log(bwght$faminc)

# Smokers are mothers with any positive cigarette count. The previous
# filter (cigs > 1) left mothers smoking exactly one cigarette out of
# both groups, since non-smokers are defined as cigs == 0.
smoke_data <- bwght[bwght$cigs > 0, ]
cor_smoke <- cor(
  smoke_data$bwght,
  smoke_data$log_income,
  use = "complete.obs"
)

non_smoke_data <- bwght[bwght$cigs == 0, ]
cor_non_smoke <- cor(
  non_smoke_data$bwght,
  non_smoke_data$log_income,
  use = "complete.obs"
)

cor_smoke
cor_non_smoke

# 4a. Mean of fatheduc and the number of non-missing fatheduc values.

count_fatheduc <- sum(!is.na(bwght[["fatheduc"]]))
mean_fatheduc <- mean(bwght[["fatheduc"]], na.rm = TRUE)

mean_fatheduc
count_fatheduc

# 4b. Share of mothers who are high school graduates.
# The mean of a logical vector is the proportion of TRUE values; here
# TRUE means motheduc is at least 12. Missing values are dropped.
prop_highschool <- mean(bwght[["motheduc"]] >= 12, na.rm = TRUE)

prop_highschool

# 4c. Average birth weight by high school graduation status.

# Flag mothers with at least 12 years of education. The column is
# referenced by its full name `motheduc`; the earlier `mothed` only worked
# through `$` partial matching, which breaks silently if another column
# with the same prefix is ever added.
bwght$highschool <- bwght$motheduc >= 12

# Mean birth weight within each level of the flag.
avg_bwght_highschool <- aggregate(bwght ~ highschool, data = bwght, FUN = mean)

# Boxplot of birth weight for each level of the flag.
ggplot(bwght, aes(x = factor(highschool), y = bwght)) +
  geom_boxplot() +
  labs(
    title = "Birth Weight by High School Graduation Status",
    x = "High School Graduate",
    y = "Birth Weight"
  )

avg_bwght_highschool

# QUESTION 2
data(meap01)

# 1. Smallest and largest values of read4 and the gap between them
# (missing values dropped).
max_read4 <- max(meap01[["read4"]], na.rm = TRUE)
min_read4 <- min(meap01[["read4"]], na.rm = TRUE)
difference_read4 <- max_read4 - min_read4

min_read4
max_read4
difference_read4

# 2. Number and percentage of schools with a perfect pass rate, plus the
# number of schools whose read4 value is exactly 50.

total_schools <- nrow(meap01)

# Summing a logical vector counts its TRUE entries; NAs are skipped.
perfect_pass_rate_count <- sum(meap01[["read4"]] == 100, na.rm = TRUE)
pass_rate_50_count <- sum(meap01[["read4"]] == 50, na.rm = TRUE)

# Share of all rows in meap01, expressed as a percentage.
percentage_perfect <- (perfect_pass_rate_count / total_schools) * 100

perfect_pass_rate_count
percentage_perfect
pass_rate_50_count

# 3. Average pass rates for math4 and read4, shown as a bar chart.

avg_read4 <- mean(meap01[["read4"]], na.rm = TRUE)
avg_math4 <- mean(meap01[["math4"]], na.rm = TRUE)

avg_math4
avg_read4

library(ggplot2)

# One row per subject so each average becomes its own bar.
avg_rates <- data.frame(
  Subject = c("Math", "Reading"),
  Average_Pass_Rate = c(avg_math4, avg_read4)
)

ggplot(
  avg_rates,
  aes(x = Subject, y = Average_Pass_Rate, fill = Subject)
) +
  geom_bar(stat = "identity") +
  labs(
    title = "Average Pass Rates for Math and Reading",
    x = "Subject",
    y = "Average Pass Rate"
  )

# 4 a and b. Correlation between math4 and read4, and a scatterplot.

# cor() computes the Pearson coefficient by default; only rows where
# both values are present are used.
correlation <- cor(
  meap01[["math4"]],
  meap01[["read4"]],
  use = "complete.obs"
)

correlation

# Points are coloured by enroll on the "Spectral" palette, with a linear
# fit drawn without its confidence band.
ggplot(meap01, aes(x = math4, y = read4)) +
  geom_point(aes(color = enroll)) +
  geom_smooth(method = "lm", se = FALSE) +
  labs(
    title = "Scatterplot of Math vs. Reading Pass Rates",
    x = "Math Pass Rate",
    y = "Reading Pass Rate"
  ) +
  scale_color_distiller(palette = "Spectral")

# 5. Create categories for school size and calculate average pass rates.

# Bin enroll into three size classes. The "Small (<300)" label used to be
# split across lines inside the string literal, which embedded newline
# characters in the factor level.
# NOTE(review): cut() closes intervals on the right by default, so a
# school with exactly 300 students is labelled "Small (<300)" -- confirm
# this boundary is intended.
meap01$size_cat <- cut(
  meap01$enroll,
  breaks = c(-Inf, 300, 600, Inf),
  labels = c("Small (<300)", "Medium (300-600)", "Large (>600)")
)

# Mean math4 and read4 within each size category.
avg_pass_rates_by_size <- aggregate(
  cbind(math4, read4) ~ size_cat,
  data = meap01,
  FUN = mean,
  na.rm = TRUE
)

# Reshape the per-size averages to long form: one row per size category
# and subject. Dodging only separates bars drawn by the same layer, so
# the previous two geom_bar() layers were painted on top of each other
# and the later layer covered the earlier one.
pass_rates_long <- data.frame(
  size_cat = rep(avg_pass_rates_by_size$size_cat, times = 2),
  Subject = rep(c("Math", "Reading"), each = nrow(avg_pass_rates_by_size)),
  Average_Pass_Rate = c(
    avg_pass_rates_by_size$math4,
    avg_pass_rates_by_size$read4
  )
)

# Side-by-side bars: one per subject within each size category.
ggplot(
  pass_rates_long,
  aes(x = size_cat, y = Average_Pass_Rate, fill = Subject)
) +
  geom_bar(stat = "identity", position = "dodge") +
  labs(
    title = "Average Pass Rates by School Size",
    x = "School Size Category",
    y = "Average Pass Rate"
  ) +
  scale_fill_manual(
    name = "Subject",
    values = c("Math" = "blue", "Reading" = "red")
  )

# QUESTION 3

data(wage1)

# 1. Average, lowest and highest years of education (missing values
# dropped).
max_education <- max(wage1[["educ"]], na.rm = TRUE)
min_education <- min(wage1[["educ"]], na.rm = TRUE)
avg_education <- mean(wage1[["educ"]], na.rm = TRUE)

avg_education
min_education
max_education

# 2. Average per-hour wage (missing values dropped).
avg_wage <- mean(wage1[["wage"]], na.rm = TRUE)

avg_wage

# 3. Proportion of women and men in the sample.

# The mean of `female` is taken as the share of women; men are the
# complement.
prop_women <- mean(wage1[["female"]], na.rm = TRUE)
prop_men <- 1 - prop_women

prop_women
prop_men

# 4. Probability that a randomly chosen woman is married.

# Keep only rows where female equals 1; which() drops rows where the
# comparison is NA, matching what subset() does.
women_data <- wage1[which(wage1[["female"]] == 1), , drop = FALSE]

# Mean of `married` among those rows.
prop_married_women <- mean(women_data[["married"]], na.rm = TRUE)

prop_married_women

# 5a. Association between hourly wage and education.

library(ggplot2)

# Scatterplot of wage against educ with a fitted linear trend line.
wage_educ_mapping <- aes(x = educ, y = wage)
ggplot(wage1, wage_educ_mapping) +
  geom_point() +
  geom_smooth(method = "lm") +
  labs(
    title = "Hourly Wage vs. Education",
    x = "Years of Education",
    y = "Hourly Wage"
  )

# 5b. Hourly wage and education by marital status.

# Colour is mapped to `married`, so points and linear fits (drawn without
# confidence bands) are separated by its two levels.
ggplot(
  wage1,
  aes(x = educ, y = wage, color = factor(married))
) +
  geom_point() +
  geom_smooth(method = "lm", se = FALSE) +
  labs(
    title = "Hourly Wage vs. Education by Marital Status",
    x = "Years of Education",
    y = "Hourly Wage",
    color = "Marital Status"
  ) +
  scale_color_manual(
    values = c("blue", "red"),
    labels = c("Unmarried", "Married")
  )

# 5c. Hourly wage and education by gender and marital status.

# Colour is mapped to `married` and point shape to `female`.
# Each `+` must end the line it continues. It used to sit on a line of
# its own after the complete ggplot() call, so R drew an empty plot and
# then failed on the remaining layers as a separate expression.
ggplot(
  wage1,
  aes(x = educ, y = wage, color = factor(married), shape = factor(female))
) +
  geom_point() +
  geom_smooth(method = "lm", se = FALSE) +
  labs(
    title = "Hourly Wage vs. Education by Gender and Marital Status",
    x = "Years of Education",
    y = "Hourly Wage",
    color = "Marital Status",
    shape = "Gender"
  ) +
  scale_color_manual(
    values = c("blue", "red"),
    labels = c("Unmarried", "Married")
  ) +
  scale_shape_manual(values = c(16, 17), labels = c("Male", "Female"))

Manual Caterpillar 928g It28g Wheel Loaders Implements System Hydraulic Control Valves Kickout Positioner PDF
100% (11)
Manual Caterpillar 928g It28g Wheel Loaders Implements System Hydraulic Control Valves Kickout Positioner PDF
8 pages
Advanced Statistical Methods Using R
No ratings yet
Advanced Statistical Methods Using R
32 pages
R File Code
No ratings yet
R File Code
16 pages
R For Health Data Science 1st Edition Complete Volume Download
No ratings yet
R For Health Data Science 1st Edition Complete Volume Download
15 pages
DP Unit1 Notes
No ratings yet
DP Unit1 Notes
18 pages
Modelling With R
No ratings yet
Modelling With R
3 pages
Prob Lab
No ratings yet
Prob Lab
10 pages
Normality and Correlation Analysis
No ratings yet
Normality and Correlation Analysis
4 pages
Syllabus Apni Kaksha
No ratings yet
Syllabus Apni Kaksha
1 page
BAN5
No ratings yet
BAN5
2 pages
R Multiple Regression Exercise 2019
No ratings yet
R Multiple Regression Exercise 2019
6 pages
Assignment-1 80501
No ratings yet
Assignment-1 80501
6 pages
Lab 2
No ratings yet
Lab 2
22 pages
Lecture 1
No ratings yet
Lecture 1
167 pages
Descriptive Statistics & R Analysis Assignment
No ratings yet
Descriptive Statistics & R Analysis Assignment
8 pages
Assignment JTW115E 2023-2024 v5
No ratings yet
Assignment JTW115E 2023-2024 v5
5 pages
Problem Set
No ratings yet
Problem Set
8 pages
"Cps - TXT" "Education" "South" "SEX" "Experience" "Union" "WAGE" "AGE" "RACE" "Occupat Ion" "Sector" "MARR"
No ratings yet
"Cps - TXT" "Education" "South" "SEX" "Experience" "Union" "WAGE" "AGE" "RACE" "Occupat Ion" "Sector" "MARR"
9 pages
Statistics Assignment
No ratings yet
Statistics Assignment
4 pages
CS1B April 2024
No ratings yet
CS1B April 2024
9 pages
Plotting With Ggplot: Install - Packages ("Ggplot2") Library (Ggplot2)
No ratings yet
Plotting With Ggplot: Install - Packages ("Ggplot2") Library (Ggplot2)
3 pages
Sta108hw4 1
No ratings yet
Sta108hw4 1
5 pages
Multicollinearity and Oaxaca - Tutorial
No ratings yet
Multicollinearity and Oaxaca - Tutorial
35 pages
Exercícios Da 1 Aula
No ratings yet
Exercícios Da 1 Aula
6 pages
DSA Lab
No ratings yet
DSA Lab
29 pages
2 R - Zajecia - 4 - Eng
No ratings yet
2 R - Zajecia - 4 - Eng
7 pages
Problem Set 1: Introduction To R - Solutions With R Output: 1 Install Packages
No ratings yet
Problem Set 1: Introduction To R - Solutions With R Output: 1 Install Packages
24 pages
R Studio Notes
No ratings yet
R Studio Notes
6 pages
Ggplot2 Exercise
No ratings yet
Ggplot2 Exercise
6 pages
R Programming-1
No ratings yet
R Programming-1
6 pages
Copy Entire Document Content in R Studio: R Script Compiled by Mr. Anup Sharma (Strictly To Be Used As Class Notes)
No ratings yet
Copy Entire Document Content in R Studio: R Script Compiled by Mr. Anup Sharma (Strictly To Be Used As Class Notes)
15 pages
Jogger Headset Demand Forecasting
No ratings yet
Jogger Headset Demand Forecasting
4 pages
Preprocessing - Preprocessing Your Data With R
No ratings yet
Preprocessing - Preprocessing Your Data With R
23 pages
R Code
No ratings yet
R Code
9 pages
R Practical
No ratings yet
R Practical
9 pages
R
No ratings yet
R
6 pages
S24 Stats10 Lab1-1
No ratings yet
S24 Stats10 Lab1-1
8 pages
Fixed Versus Random Effects
No ratings yet
Fixed Versus Random Effects
82 pages
Mock Exam - Appendix
No ratings yet
Mock Exam - Appendix
15 pages
Fda SSIGNMENT 02
No ratings yet
Fda SSIGNMENT 02
13 pages
Plunger Lift Brochure
No ratings yet
Plunger Lift Brochure
4 pages
Copy Entire Document Content in R Studio
No ratings yet
Copy Entire Document Content in R Studio
17 pages
Dokumen - Tips Basic Flowsheeting Principles Thermart Himmelblau D M and Riggs J B 2003 Basic
No ratings yet
Dokumen - Tips Basic Flowsheeting Principles Thermart Himmelblau D M and Riggs J B 2003 Basic
111 pages
Making Salts
No ratings yet
Making Salts
29 pages
Chemistry Basics for Students
No ratings yet
Chemistry Basics for Students
16 pages
Experiment 2
No ratings yet
Experiment 2
7 pages
Combined 8 15
No ratings yet
Combined 8 15
8 pages
Lab Manual - DSR
No ratings yet
Lab Manual - DSR
32 pages
R Training AM
No ratings yet
R Training AM
6 pages
Merge
No ratings yet
Merge
28 pages
R Practicals
No ratings yet
R Practicals
32 pages
BDA MSC It
No ratings yet
BDA MSC It
35 pages
IntroR 2
No ratings yet
IntroR 2
18 pages
Commands For Data Analysis Using R
No ratings yet
Commands For Data Analysis Using R
11 pages
R Working Materials Prep
No ratings yet
R Working Materials Prep
43 pages
2 T24Updates
No ratings yet
2 T24Updates
24 pages
Azure Databricks Course Content - Pratap - Qbex Technologies - 8886230001
No ratings yet
Azure Databricks Course Content - Pratap - Qbex Technologies - 8886230001
3 pages
Workshop Activity: X Seq y Length
No ratings yet
Workshop Activity: X Seq y Length
3 pages
Supervised Learning by Fadhlurrohman Henriwan
No ratings yet
Supervised Learning by Fadhlurrohman Henriwan
31 pages
DA Manual - Part B
No ratings yet
DA Manual - Part B
13 pages
Lab File AD PDF
No ratings yet
Lab File AD PDF
25 pages
R Stats Cheatsheet
No ratings yet
R Stats Cheatsheet
1 page
R Practice
No ratings yet
R Practice
38 pages
Differentiates Kinds of Variables and Their Uses
No ratings yet
Differentiates Kinds of Variables and Their Uses
4 pages
Mathematics For Electrical Science and Physical Science, M-1, S2
No ratings yet
Mathematics For Electrical Science and Physical Science, M-1, S2
4 pages
R ggplot2 Code Examples & Tips
No ratings yet
R ggplot2 Code Examples & Tips
22 pages
DALab Part-B BCU&BU
No ratings yet
DALab Part-B BCU&BU
12 pages
Assignment 1 CHE544 20232
No ratings yet
Assignment 1 CHE544 20232
5 pages
Data Analysis for Analysts
No ratings yet
Data Analysis for Analysts
56 pages
GIS-Based Erosion Risk Mapping
No ratings yet
GIS-Based Erosion Risk Mapping
17 pages
BM-1, Applied Statistics, Lesson 2: Comparing Two Groups (And One Group)
No ratings yet
BM-1, Applied Statistics, Lesson 2: Comparing Two Groups (And One Group)
39 pages
Modeling and Visulizing Data Using R: A Practical Introduction
No ratings yet
Modeling and Visulizing Data Using R: A Practical Introduction
106 pages
UK Experkience ATF 2 X 25 KV PDF
No ratings yet
UK Experkience ATF 2 X 25 KV PDF
12 pages
CMM 26-11-15 PN CG7G0 Smoke Detector
No ratings yet
CMM 26-11-15 PN CG7G0 Smoke Detector
56 pages
Final Report v1.5 Lucknow
No ratings yet
Final Report v1.5 Lucknow
173 pages
Ccnet 10f Lec02 ch2
No ratings yet
Ccnet 10f Lec02 ch2
42 pages
Midpalatal Miniscrew Insertion The Accuracy of Di
No ratings yet
Midpalatal Miniscrew Insertion The Accuracy of Di
7 pages
Coffee Habits of Mumbai Students
No ratings yet
Coffee Habits of Mumbai Students
12 pages
DS 2CD2T23G0 I520180404aawrc12389314 - 20221006123632
No ratings yet
DS 2CD2T23G0 I520180404aawrc12389314 - 20221006123632
26 pages
Diffusion of Solids in Liquids
No ratings yet
Diffusion of Solids in Liquids
8 pages
Nimbus VTOL Manual 180306
100% (1)
Nimbus VTOL Manual 180306
11 pages
Straight To Market in An Autoinjector
No ratings yet
Straight To Market in An Autoinjector
8 pages
IPE Pre-Test 2nd Sem 23-24
No ratings yet
IPE Pre-Test 2nd Sem 23-24
3 pages
University Semester Practical Exam Schedule NOv-Dec 2024 - 3 - 5 - Semester
No ratings yet
University Semester Practical Exam Schedule NOv-Dec 2024 - 3 - 5 - Semester
6 pages
PhysRevB 97 161108
No ratings yet
PhysRevB 97 161108
5 pages
Procedure of Selant Application MC Teaching
No ratings yet
Procedure of Selant Application MC Teaching
2 pages
Get Invoice
No ratings yet
Get Invoice
2 pages
SAP Payroll Wage Types Explained: Search
No ratings yet
SAP Payroll Wage Types Explained: Search
2 pages