# Advanced R Programming Tidyverse Notes
# Data Wrangling
# 1) Discovering
# 2) Structuring
# 3) Cleaning
# 4) Enriching
# 5) Validating
## Data wrangling with the tidyverse package
library(tidyverse)
# Inspect the full dataset: show it in the console, then open the viewer.
diamonds
View(diamonds)

# Filter rows into a sub-dataset ----
# Keep only the diamonds whose cut is "Ideal".
# Note: `diamond_sm` (no "s") and `diamonds_sm` below are two distinct objects.
diamond_sm <- diamonds %>%
  filter(cut == "Ideal")
diamond_sm
View(diamond_sm)

# Several conditions given to filter() must all hold for a row to be kept:
# here, an "Ideal" cut and a price above 10000.
diamonds_sm <- diamonds %>%
  filter(cut == "Ideal", price > 10000)
diamonds_sm
View(diamonds_sm)
# Filter for missing values ----
# is.na() on a data frame only yields a TRUE/FALSE matrix with one cell per
# value; printing it filters nothing. Instead, count the NAs per column for a
# quick overview, then keep only the rows with at least one missing value.
print(colSums(is.na(diamonds_sm)))
print(filter(diamonds_sm, if_any(everything(), is.na)))
# Subset by column ----
# Pick columns by name. select() keeps the original column names and returns
# a tibble, whereas data.frame(diamonds$cut, diamonds$color) would rename the
# columns to diamonds.cut / diamonds.color and drop the tibble class.
diamonds_sm <- diamonds %>%
  select(cut, color)
diamonds_sm

# Pick columns by position: the first four columns.
diamonds_sm <- diamonds %>%
  select(1:4)
View(diamonds_sm)

# Pick every column whose name contains the letter "c".
diamonds_c <- diamonds %>%
  select(contains("c"))
diamonds_c
View(diamonds_c)

# Move price, table and depth to the front; everything() appends the rest.
diamonds_E <- diamonds %>%
  select(price, table, depth, everything())
View(diamonds_E)

# Drop columns: the minus sign excludes the listed columns.
diamonds_N <- diamonds %>%
  select(-c(price, depth, table))
diamonds_N
# Reorder rows ----
# arrange() sorts rows (it does not move columns): by color first, then by
# carat within each color, both ascending.
diamonds_arr <- arrange(diamonds, color, carat)
diamonds_arr
View(diamonds_arr)

# Sort in descending order by wrapping the column in desc().
diamonds_arr <- arrange(diamonds, desc(carat))
View(diamonds_arr)
# Add or modify columns ----
# mutate() adds new columns and overwrites existing ones that share a name.
diamonds_new <- diamonds %>%
  mutate(
    # One metric carat is 200 mg, i.e. 0.2 g (the previous 0.02 factor was
    # off by a factor of ten).
    mass_g = 0.2 * carat,
    price_per_carat = price / carat,
    # tolower() returns character, so `cut` is no longer a factor afterwards.
    cut = tolower(cut),
    # Logical flag: TRUE when the price exceeds 10000.
    expensive = price > 10000
  )
diamonds_new
View(diamonds_new)