r-cheatsheet-ABCD

Uploaded by

perazajesus26

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

0 views

r-cheatsheet-ABCD

Uploaded by

perazajesus26

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 3

Advanced Statistics and Data Science (ABCD) CHEAT SHEET

Word Equations Summary Tables Simple Statistics

outcome = explanatory + other stuff # compute five-number summary mean(data_set$Y)
favstats(~ Y, data = data_set) var(data_set$Y)
Y = X + other stuff sd(data_set$Y)
# create frequency table
Basics tally(data_set$Y) cohensD(Y ~ X, data = data_set)
tally(~ Y, data = data_set) cor(Y ~ X, data = data_set)
print("Hello world!")
# tally by condition b1(Y ~ X, data = data_set)
# assign value to object tally(~ Y < 1900, data = data_set) b1(one_model)
my_number <- 5
# two-way frequency table pre(Y ~ X, data = data_set)
# combine values into vector tally(Y ~ X, data = data_set, margin = TRUE, f(Y ~ X, data = data_set)
my_vector <- c(1, 2, 3) format = "proportion")
# sample F for X2
# first element in vector f(Y ~ X1 + X2,
my_vector[1] data = data_set, predictor = ~X2)

# orders values or cases

sort(my_vector) Data Frame
# arithmetic operations # structure of data frame # arrange rows by variable
sum(1, 2, 100), +, -, *, / str(data_set) arrange(data_set, Y)
sqrt(157)
abs(data_set$Y) # view first/last six rows # creates data frame from csv file
head(data_set) data_set <- read.csv("file_name", header = TRUE)
# logical operations tail(data_set)
>, <, >=, <=, ==, !=, |, & # convert quantitative variable
# select multiple variables # to categorical
# results in a new variable with values select(data_set, Y1, Y2) factor(data_set$Y)
# of TRUE or FALSE factor(data_set$Y,
data_set$C <- data_set$A > data_set$B # first six rows of selected variables levels = c(1,2),
head(select(data_set, Y1, Y2)) labels = c("A", "B"))

Probability Distribution # transform values

# select variable (a column) recode(data_set$Y, "0" = 0, "1" = 50, "2" = 100)
# calculate the probability area
xpnorm(65.1, data_set$mean, data_set$sd) data_set$Y
# creates two equal sized groups
# find rows that meet condition ntile(data_set$Y, 2)
zscore(data_set$Y)
data_set[data_set$Y > 40, ] # convert categorical variable
# returns t at this probability filter(data_set, Y > 300) # to quantitative
qt(.975, df = 999) as.numeric(data_set$Y)
# returns F at this probability # find rows that do not have NA
qf(.95, df1 = 1, df2 = 100) filter(data_set, is.na(Y) == FALSE)
filter(data_set, !is.na(Y))
# CI using t distribution
confint(empty_model)

# calculate p-value using F-distribution

xpf(sample_f, df1 = 2 , df2 = 10)

Page: 1 ▷ Updated: 2024-10 ▷ Learn more about CourseKata @ https://coursekata.org

Advanced Statistics and Data Science (ABCD) CHEAT SHEET
Simulation Fitting and Evaluating Models
# sample without replacement # randomize sampling distribution of b1s, # empty model
sample(data_set, 6) # centered on 0 empty_model <- lm(Y ~ NULL,
sdob1 <- do(1000) * data = data_set)
# sample with replacement b1(shuffle(Y) ~ X, data = data_set)
resample(data_set, 10) # use one explanatory variable
# bootstrap sampling distribution of b1s, one_model <- lm(Y ~ X, data = data_set)
do(3) * resample (data_set, 10) # centered on sample b1
sdob1_boot <- do(1000) * # use more than one explanatory variable
# mixes up values in a variable b1(Y ~ X, data = resample(data_set)) # multivariate model
shuffle(data_set$Y) multi_model <- lm(Y ~ X1 + X2, data = data_set)
# count the number of b1s at the upper
# simulate sampling 10000 Ys # and lower extreme # all the model comparisons that can be
# from normal distribution tally(sdob1$b1 > sample_b1 | # made in relation to the multivariate model
sim_Y <- rnorm(10000, Y_stats$mean, sdob1$b1 < -sample_b1) generate_models(multi_model)
Y_stats$sd)
# model predictions and residuals
# put simulated Ys into dataframe # return TRUE for middle 95% of distribution data_set$empty_predict <- predict(empty_model)
data_set<- data.frame(sim_Y) middle(sdob1$b1, .95) data_set$empty_resid <- resid(empty_model)
# randomize sampling distribution of PREs # produce ANOVA table
# simulate
sdopre <- do(1000) * pre(shuffle(Y) ~ X, anova(empty_model)
# sampling distribution of means data = data_set)
sdom_sim <- do(10000) * mean(rnorm(157, supernova(one_model)
Y_stats$mean, Y_stats$sd)) # randomize sampling distribution of Fs
sdof <- do(1000) * # t-test, using pooled variance
# bootstrap f(shuffle(Y) ~ X, data = data_set) t.test(Tip ~ Condition, data = data_set,
# sampling distribution of means var.equal=TRUE)
sdom_boot <- do(10000) * # counts extreme Fs
mean(resample(data_set$Y, 157)) sample_f <- f(Y ~ X, data = data_set) # pairwise comparison corrections:
tally(~f > sample_f, data = sdof) # "Tukey","Bonferroni","none"
pairwise(one_model, correction = "none")

Page: 2 ▷ Updated: 2024-10 ▷ Learn more about CourseKata @ https://coursekata.org

Advanced Statistics and Data Science (ABCD) CHEAT SHEET
Visualizations
gf_histogram(~ Y, data = data_set) %>% # sampling distribution of b1
gf_point(Y ~ X, data = data_set) # change labels gf_histogram(~b1, data = sdob1,
gf_labs(title = "Graph Title", fill = ~middle(b1, .95)) %>%
x = "Y_Name", y = "Frequency") # modify the limits on x- and y-axes
gf_lims(x = c(-12, 12), y = c(0, 70))

gf_jitter(Y ~ X, data = data_set)

# faceted grid of histograms
gf_histogram(~ Y, data = data_set) %>%
gf_facet_grid(X ~ .)

gf_point(Y ~ X, data = data_set) %>%

# add model predictions as red points
gf_point(Y ~ X , shape = 1, size = 3,
color = "firebrick") %>%
# add best fitting model as a red line
gf_boxplot(Y ~ X, data = data_set) gf_model(one_model, color = "red")

gf_dhistogram(~ Y, data = data_set,

fill = "orange") %>%
gf_density()

gf_boxplot(Y ~ X, data = data_set, fill = pairwise(one_model, plot = TRUE)

"orange") %>%
gf_jitter(height = 0, alpha = .2, size = 3)
gf_bar( ~ Y, data = data_set)

Page: 3 ▷ Updated: 2024-10 ▷ Learn more about CourseKata @ https://coursekata.org

R Cheat Sheet Merged
100% (2)
R Cheat Sheet Merged
35 pages
R Cheat Sheet
No ratings yet
R Cheat Sheet
4 pages
r-cheatsheet-ABCD (1)
No ratings yet
r-cheatsheet-ABCD (1)
3 pages
r-cheatsheet-ABC
No ratings yet
r-cheatsheet-ABC
3 pages
r-cheatsheet-ABC (1)
No ratings yet
r-cheatsheet-ABC (1)
3 pages
CourseKata r Cheatsheet ABC (1)
No ratings yet
CourseKata r Cheatsheet ABC (1)
5 pages
r-cheatsheet-ABCD (3)
No ratings yet
r-cheatsheet-ABCD (3)
4 pages
A Short List of Some Useful R Commands: Input and Display
No ratings yet
A Short List of Some Useful R Commands: Input and Display
2 pages
A Short List of The Most Useful R Commands
No ratings yet
A Short List of The Most Useful R Commands
11 pages
R Course
No ratings yet
R Course
7 pages
A Short List of The Most Useful R Commands
No ratings yet
A Short List of The Most Useful R Commands
8 pages
R Intro 2011
No ratings yet
R Intro 2011
115 pages
BAN5
No ratings yet
BAN5
2 pages
Cost Practical
No ratings yet
Cost Practical
13 pages
STAT-2450 Assignment 1: Name:, Student ID: B00
No ratings yet
STAT-2450 Assignment 1: Name:, Student ID: B00
9 pages
STTN 225 R Summary
No ratings yet
STTN 225 R Summary
18 pages
UL2
No ratings yet
UL2
2 pages
Workshop Activity: X Seq y Length
No ratings yet
Workshop Activity: X Seq y Length
3 pages
Basics: TH TH TH TH TH TH TH
No ratings yet
Basics: TH TH TH TH TH TH TH
3 pages
Final Cost Practical
No ratings yet
Final Cost Practical
29 pages
R Commands
No ratings yet
R Commands
5 pages
Ali
No ratings yet
Ali
31 pages
Big Data Slip Solution
No ratings yet
Big Data Slip Solution
18 pages
Session Set Working Directory Choose Directlry
No ratings yet
Session Set Working Directory Choose Directlry
17 pages
Chapter 5
No ratings yet
Chapter 5
22 pages
R Commands: Appendix B
No ratings yet
R Commands: Appendix B
5 pages
R_Tutorial
No ratings yet
R_Tutorial
32 pages
Basics of Statistics and Probability - FP: Statistical Measures
No ratings yet
Basics of Statistics and Probability - FP: Statistical Measures
12 pages
Huraira
No ratings yet
Huraira
26 pages
Commands for Data Analysis using R
No ratings yet
Commands for Data Analysis using R
11 pages
R Cheat Sheet: 1. Basics 4. Input and Export of Data
100% (1)
R Cheat Sheet: 1. Basics 4. Input and Export of Data
4 pages
Essential R
No ratings yet
Essential R
261 pages
R Tutorial #1: Applied Econometrics (Econ3005)
No ratings yet
R Tutorial #1: Applied Econometrics (Econ3005)
21 pages
R Intro STAT5000
No ratings yet
R Intro STAT5000
17 pages
R Programming Practical File
No ratings yet
R Programming Practical File
38 pages
FM Statistics, Fall 2022, Homework 02
No ratings yet
FM Statistics, Fall 2022, Homework 02
8 pages
Analysis Using Statistical: Introduction & Data Exploration
No ratings yet
Analysis Using Statistical: Introduction & Data Exploration
23 pages
Lab file AD pdf
No ratings yet
Lab file AD pdf
25 pages
COST - JournalPracticals (1-7)
No ratings yet
COST - JournalPracticals (1-7)
22 pages
R Examples
No ratings yet
R Examples
56 pages
R Syntax Examples 1
No ratings yet
R Syntax Examples 1
6 pages
Merge
No ratings yet
Merge
28 pages
R Programing Bhagu
No ratings yet
R Programing Bhagu
40 pages
Econometrics 2019 PDF
No ratings yet
Econometrics 2019 PDF
143 pages
Module - 4 (R Training) - Basic Stats & Modeling
No ratings yet
Module - 4 (R Training) - Basic Stats & Modeling
15 pages
Practical 5 2
No ratings yet
Practical 5 2
7 pages
Using R For Introductory Statistics 1st Edition John Verzani - The full ebook version is just one click away
No ratings yet
Using R For Introductory Statistics 1st Edition John Verzani - The full ebook version is just one click away
46 pages
Cours BI - R
No ratings yet
Cours BI - R
18 pages
34314
No ratings yet
34314
51 pages
R Complete
No ratings yet
R Complete
24 pages
R Commands
No ratings yet
R Commands
2 pages
Introduction To R PDF
No ratings yet
Introduction To R PDF
56 pages
Useful R Functions-1
No ratings yet
Useful R Functions-1
4 pages
Mid Sem-1 - Faids
No ratings yet
Mid Sem-1 - Faids
2 pages
R Console
No ratings yet
R Console
6 pages
RSTUDIO
No ratings yet
RSTUDIO
44 pages
R Code
No ratings yet
R Code
13 pages
DSR LAB MANUAL - 10 programs
No ratings yet
DSR LAB MANUAL - 10 programs
34 pages
The Essential R Reference
From Everand
The Essential R Reference
Mark Gardener
No ratings yet
Calculus I Essentials
From Everand
Calculus I Essentials
Editors of REA
1/5 (1)
How To Configure FCIP On Brocade 7500's
No ratings yet
How To Configure FCIP On Brocade 7500's
10 pages
Literature Review On Internet Service Providers
100% (2)
Literature Review On Internet Service Providers
9 pages
Pilot 480V
No ratings yet
Pilot 480V
1 page
Wearable_Technology_Seminar_Report
No ratings yet
Wearable_Technology_Seminar_Report
4 pages
Unit 6 Testing of Ic Engine
No ratings yet
Unit 6 Testing of Ic Engine
15 pages
FW3550 19.0v1 Troubleshooting Multifactor Authentication On Sophos Firewall
No ratings yet
FW3550 19.0v1 Troubleshooting Multifactor Authentication On Sophos Firewall
11 pages
Digital Logic Syllabus
No ratings yet
Digital Logic Syllabus
5 pages
Chapter 4 - LOOKUP AND REFERENCES FUNCTIONS
No ratings yet
Chapter 4 - LOOKUP AND REFERENCES FUNCTIONS
8 pages
3147411 - Migration Cockpit Direct Transfer approach - Fixed Asset( including Balance)
No ratings yet
3147411 - Migration Cockpit Direct Transfer approach - Fixed Asset( including Balance)
2 pages
Linear Functions Test 4C-4G 2020
No ratings yet
Linear Functions Test 4C-4G 2020
5 pages
Emerging Technologies in Education 2
No ratings yet
Emerging Technologies in Education 2
7 pages
Isabella Costa Resume
No ratings yet
Isabella Costa Resume
2 pages
Desing and Analysis of Pole For Hybrid Energy System With Led Street Light
No ratings yet
Desing and Analysis of Pole For Hybrid Energy System With Led Street Light
9 pages
VH 6.0-Administrator - User Guide
No ratings yet
VH 6.0-Administrator - User Guide
280 pages
CET® Onsite Alternate Energy
No ratings yet
CET® Onsite Alternate Energy
7 pages
Injury: Michail E. Klontzas, Georgios Z. Papadakis, Kostas Marias, Apostolos H. Karantanas
No ratings yet
Injury: Michail E. Klontzas, Georgios Z. Papadakis, Kostas Marias, Apostolos H. Karantanas
9 pages
Price List Apple Education (NPI 19 October 2022)
No ratings yet
Price List Apple Education (NPI 19 October 2022)
9 pages
SH III Manual - English
No ratings yet
SH III Manual - English
31 pages
Reading Comprehension
No ratings yet
Reading Comprehension
22 pages
Synchronous Machines Questions Part-02
No ratings yet
Synchronous Machines Questions Part-02
25 pages
Mtech ECE Syllabus 04 01 23
No ratings yet
Mtech ECE Syllabus 04 01 23
112 pages
Share Market Course Details
No ratings yet
Share Market Course Details
3 pages
Error Code: Display Example
No ratings yet
Error Code: Display Example
1 page
T2720 Datasheet 0010
No ratings yet
T2720 Datasheet 0010
1 page
Expired Opp HW North 10-29-2021 - SB
No ratings yet
Expired Opp HW North 10-29-2021 - SB
10 pages
Determining Probabilities
No ratings yet
Determining Probabilities
5 pages
Hotel Dashboard
No ratings yet
Hotel Dashboard
41 pages
Test Case Writing
No ratings yet
Test Case Writing
10 pages
EasyWOODIng manual book
No ratings yet
EasyWOODIng manual book
455 pages
Flyer HumaScopeLine EN
No ratings yet
Flyer HumaScopeLine EN
12 pages

r-cheatsheet-ABCD

Uploaded by

r-cheatsheet-ABCD

Uploaded by

Advanced Statistics and Data Science (ABCD) CHEAT SHEET

Word Equations Summary Tables Simple Statistics

# orders values or cases

Probability Distribution # transform values

# calculate p-value using F-distribution

Page: 1 ▷ Updated: 2024-10 ▷ Learn more about CourseKata @ https://coursekata.org

Page: 2 ▷ Updated: 2024-10 ▷ Learn more about CourseKata @ https://coursekata.org

gf_jitter(Y ~ X, data = data_set)

gf_point(Y ~ X, data = data_set) %>%

gf_dhistogram(~ Y, data = data_set,

gf_boxplot(Y ~ X, data = data_set, fill = pairwise(one_model, plot = TRUE)

Page: 3 ▷ Updated: 2024-10 ▷ Learn more about CourseKata @ https://coursekata.org

You might also like