Skip to content

Instantly share code, notes, and snippets.

@naomispence
Created October 15, 2024 17:15
Show Gist options
  • Save naomispence/70e8f584a9db3cdd21535ca916decd0d to your computer and use it in GitHub Desktop.
Save naomispence/70e8f584a9db3cdd21535ca916decd0d to your computer and use it in GitHub Desktop.
# Template: replace VARNAME with your variable's name, and edit every title
# and x-axis label placeholder, before running this script.
# NOTE(review): frequency() is called here with `title` and
# `cumulative.percent` arguments, so it is presumably a course-package helper
# rather than stats::frequency() -- confirm the package is loaded.

# Frequency distribution of the variable.
frequency(
  addhealthW5$VARNAME,
  title = "Frequency Distribution of YOUR VARIABLE DESCRIPTION"
)
# Interpret the output of the call above.

# Same call with the cumulative percent option switched on.
frequency(
  addhealthW5$VARNAME,
  cumulative.percent = TRUE,
  title = "YOUR VARIABLE DESCRIPTION"
)
# Interpret the output of the call above.
# Bar graph showing the percent of cases in each category of VARNAME.
# Rows where VARNAME is NA are dropped first, so missing values are excluded
# from both the bars and the percent denominator.
ggplot(
  data = subset(addhealthW5, !is.na(VARNAME)),
  aes(x = VARNAME)
) +
  geom_bar(
    color = "blue",
    fill = "yellow",
    # after_stat() replaces the deprecated ..count.. notation; each bar's
    # height is its count divided by the total count of plotted rows.
    aes(y = after_stat(count / sum(count)))
  ) +
  # Show the 0-1 proportions on the y-axis as percentages.
  scale_y_continuous(labels = scales::percent) +
  ggtitle("Bar Graph of YOUR VARIABLE DESCRIPTION, Wave 5 Add Health") +
  labs(y = "Percent", x = "CATEGORIES") +
  # Rotate the x-axis category labels by -25 degrees.
  theme(axis.text.x = element_text(angle = -25))
# Interpret the graph produced by the call above.
# Histogram of VARNAME with the y-axis expressed as a percent of cases.
# Rows where VARNAME is NA are dropped up front (as in the bar graph) so that
# ggplot2 does not warn about removed rows; the plotted percents are the same
# because missing values never contribute to the bin counts.
ggplot(
  data = subset(addhealthW5, !is.na(VARNAME)),
  aes(x = VARNAME)
) +
  geom_histogram(
    color = "blue",
    fill = "green",
    binwidth = 1, # each bin is 1 unit wide
    # after_stat() replaces the deprecated ..count.. notation; each bin's
    # height is its share of all plotted cases, scaled to 0-100.
    aes(y = after_stat(count / sum(count)) * 100)
  ) +
  ggtitle("Distribution of YOUR VARIABLE DESCRIPTION, Add Health Wave 5") +
  labs(y = "Percent", x = "UNIT OF MEASUREMENT")
# Interpret the graph produced by the call above.
# Descriptive statistics for VARNAME.

# NOTE(review): MODE() is not a base R function and is not defined in the
# lines shown here -- presumably it comes from a course package; confirm that
# package is loaded before running.
MODE(addhealthW5$VARNAME)
# Interpret the result of the call above.

# Median, ignoring missing values.
median(addhealthW5$VARNAME, na.rm = TRUE)
# Interpret the result of the call above.

# summary() takes no na.rm argument for vectors (it was silently ignored);
# missing values are left out of the statistics and counted separately in
# the output.
summary(addhealthW5$VARNAME)
# Interpret the result of the call above.

# Standard deviation, ignoring missing values.
sd(addhealthW5$VARNAME, na.rm = TRUE)
# Interpret the result of the call above.
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment