R Project Document
R Project Document
STATISTICAL PROGRAMMING
WITH R LAB
Lab report submitted in partial fulfilment of the
requirements for the award of the degree of
BACHELOR OF TECHNOLOGY
IN
INFORMATION TECHNOLOGY
INDEX
SI. Cycle Name Page No Course Grade Signature
NO Outcome
1 Cycle-2 4 1
2 Cycle-3 17 1
3 Cycle-8 26 3
4 Cycle-9 40 3
5 Cycle-11 42 3
3
ANITS
CERTIFICATE
This is to certify that this report is a bonafide work carried out by M.Bala Shankar,
A.SaiSanthosh, V.HimaBindu, K.RaghunathaReddy, V.Manasa as a part of B.TECH
4th year 1st semester of Information Technology in partial fulfilment of the
requirements for the Statistical Programming With R Lab
library(tidyverse)
my_data<-as_tibble(iris)
my_data
## # A tibble: 150 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 5.1 3.5 1.4 0.2 setosa
## 2 4.9 3 1.4 0.2 setosa
## 3 4.7 3.2 1.3 0.2 setosa
## 4 4.6 3.1 1.5 0.2 setosa
## 5 5 3.6 1.4 0.2 setosa
## 6 5.4 3.9 1.7 0.4 setosa
## 7 4.6 3.4 1.4 0.3 setosa
## 8 5 3.4 1.5 0.2 setosa
## 9 4.4 2.9 1.4 0.2 setosa
## 10 4.9 3.1 1.5 0.1 setosa
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 1/13
11/1/23, 11:33 PM cycle2.knit
my_data
## # A tibble: 150 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 5.1 3.5 1.4 0.2 setosa
## 2 4.9 3 1.4 0.2 setosa
## 3 4.7 3.2 1.3 0.2 setosa
## 4 4.6 3.1 1.5 0.2 setosa
## 5 5 3.6 1.4 0.2 setosa
## 6 5.4 3.9 1.7 0.4 setosa
## 7 4.6 3.4 1.4 0.3 setosa
## 8 5 3.4 1.5 0.2 setosa
## 9 4.4 2.9 1.4 0.2 setosa
## 10 4.9 3.1 1.5 0.1 setosa
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 2/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 150 × 3
## Sepal.Length Sepal.Width Petal.Length
## <dbl> <dbl> <dbl>
## 1 5.1 3.5 1.4
## 2 4.9 3 1.4
## 3 4.7 3.2 1.3
## 4 4.6 3.1 1.5
## 5 5 3.6 1.4
## 6 5.4 3.9 1.7
## 7 4.6 3.4 1.4
## 8 5 3.4 1.5
## 9 4.4 2.9 1.4
## 10 4.9 3.1 1.5
## # ℹ 140 more rows
## # A tibble: 150 × 2
## Sepal.Length Petal.Length
## <dbl> <dbl>
## 1 5.1 1.4
## 2 4.9 1.4
## 3 4.7 1.3
## 4 4.6 1.5
## 5 5 1.4
## 6 5.4 1.7
## 7 4.6 1.4
## 8 5 1.5
## 9 4.4 1.4
## 10 4.9 1.5
## # ℹ 140 more rows
## # A tibble: 150 × 2
## Sepal.Length Petal.Length
## <dbl> <dbl>
## 1 5.1 1.4
## 2 4.9 1.4
## 3 4.7 1.3
## 4 4.6 1.5
## 5 5 1.4
## 6 5.4 1.7
## 7 4.6 1.4
## 8 5 1.5
## 9 4.4 1.4
## 10 4.9 1.5
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 3/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 150 × 2
## Petal.Length Petal.Width
## <dbl> <dbl>
## 1 1.4 0.2
## 2 1.4 0.2
## 3 1.3 0.2
## 4 1.5 0.2
## 5 1.4 0.2
## 6 1.7 0.4
## 7 1.4 0.3
## 8 1.5 0.2
## 9 1.4 0.2
## 10 1.5 0.1
## # ℹ 140 more rows
## # A tibble: 150 × 2
## Sepal.Width Petal.Width
## <dbl> <dbl>
## 1 3.5 0.2
## 2 3 0.2
## 3 3.2 0.2
## 4 3.1 0.2
## 5 3.6 0.2
## 6 3.9 0.4
## 7 3.4 0.3
## 8 3.4 0.2
## 9 2.9 0.2
## 10 3.1 0.1
## # ℹ 140 more rows
## # A tibble: 150 × 2
## Petal.Length Petal.Width
## <dbl> <dbl>
## 1 1.4 0.2
## 2 1.4 0.2
## 3 1.3 0.2
## 4 1.5 0.2
## 5 1.4 0.2
## 6 1.7 0.4
## 7 1.4 0.3
## 8 1.5 0.2
## 9 1.4 0.2
## 10 1.5 0.1
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 4/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 150 × 4
## Sepal.Length Sepal.Width Petal.Length Petal.Width
## <dbl> <dbl> <dbl> <dbl>
## 1 5.1 3.5 1.4 0.2
## 2 4.9 3 1.4 0.2
## 3 4.7 3.2 1.3 0.2
## 4 4.6 3.1 1.5 0.2
## 5 5 3.6 1.4 0.2
## 6 5.4 3.9 1.7 0.4
## 7 4.6 3.4 1.4 0.3
## 8 5 3.4 1.5 0.2
## 9 4.4 2.9 1.4 0.2
## 10 4.9 3.1 1.5 0.1
## # ℹ 140 more rows
## # A tibble: 150 × 2
## Sepal.Length Petal.Length
## <dbl> <dbl>
## 1 5.1 1.4
## 2 4.9 1.4
## 3 4.7 1.3
## 4 4.6 1.5
## 5 5 1.4
## 6 5.4 1.7
## 7 4.6 1.4
## 8 5 1.5
## 9 4.4 1.4
## 10 4.9 1.5
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 5/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 150 × 4
## Sepal.Length Sepal.Width Petal.Length Petal.Width
## <dbl> <dbl> <dbl> <dbl>
## 1 5.1 3.5 1.4 0.2
## 2 4.9 3 1.4 0.2
## 3 4.7 3.2 1.3 0.2
## 4 4.6 3.1 1.5 0.2
## 5 5 3.6 1.4 0.2
## 6 5.4 3.9 1.7 0.4
## 7 4.6 3.4 1.4 0.3
## 8 5 3.4 1.5 0.2
## 9 4.4 2.9 1.4 0.2
## 10 4.9 3.1 1.5 0.1
## # ℹ 140 more rows
## # A tibble: 150 × 3
## Sepal.Width Petal.Width Species
## <dbl> <dbl> <fct>
## 1 3.5 0.2 setosa
## 2 3 0.2 setosa
## 3 3.2 0.2 setosa
## 4 3.1 0.2 setosa
## 5 3.6 0.2 setosa
## 6 3.9 0.4 setosa
## 7 3.4 0.3 setosa
## 8 3.4 0.2 setosa
## 9 2.9 0.2 setosa
## 10 3.1 0.1 setosa
## # ℹ 140 more rows
## # A tibble: 150 × 2
## Petal.Width Species
## <dbl> <fct>
## 1 0.2 setosa
## 2 0.2 setosa
## 3 0.2 setosa
## 4 0.2 setosa
## 5 0.2 setosa
## 6 0.4 setosa
## 7 0.3 setosa
## 8 0.2 setosa
## 9 0.2 setosa
## 10 0.1 setosa
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 6/13
11/1/23, 11:33 PM cycle2.knit
# Drop column 1
my_data %>% select(-1)
## # A tibble: 150 × 4
## Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <fct>
## 1 3.5 1.4 0.2 setosa
## 2 3 1.4 0.2 setosa
## 3 3.2 1.3 0.2 setosa
## 4 3.1 1.5 0.2 setosa
## 5 3.6 1.4 0.2 setosa
## 6 3.9 1.7 0.4 setosa
## 7 3.4 1.4 0.3 setosa
## 8 3.4 1.5 0.2 setosa
## 9 2.9 1.4 0.2 setosa
## 10 3.1 1.5 0.1 setosa
## # ℹ 140 more rows
# Drop columns 1 to 3
my_data %>% select(-(1:3))
## # A tibble: 150 × 2
## Petal.Width Species
## <dbl> <fct>
## 1 0.2 setosa
## 2 0.2 setosa
## 3 0.2 setosa
## 4 0.2 setosa
## 5 0.2 setosa
## 6 0.4 setosa
## 7 0.3 setosa
## 8 0.2 setosa
## 9 0.2 setosa
## 10 0.1 setosa
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 7/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 150 × 3
## Sepal.Width Petal.Width Species
## <dbl> <dbl> <fct>
## 1 3.5 0.2 setosa
## 2 3 0.2 setosa
## 3 3.2 0.2 setosa
## 4 3.1 0.2 setosa
## 5 3.6 0.2 setosa
## 6 3.9 0.4 setosa
## 7 3.4 0.3 setosa
## 8 3.4 0.2 setosa
## 9 2.9 0.2 setosa
## 10 3.1 0.1 setosa
## # ℹ 140 more rows
## # A tibble: 6 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 5.1 3.5 1.4 0.2 setosa
## 2 4.9 3 1.4 0.2 setosa
## 3 4.7 3.2 1.3 0.2 setosa
## 4 4.6 3.1 1.5 0.2 setosa
## 5 5 3.6 1.4 0.2 setosa
## 6 5.4 3.9 1.7 0.4 setosa
library(tidyverse)
my_data<-as_tibble(iris)
my_data
## # A tibble: 150 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 5.1 3.5 1.4 0.2 setosa
## 2 4.9 3 1.4 0.2 setosa
## 3 4.7 3.2 1.3 0.2 setosa
## 4 4.6 3.1 1.5 0.2 setosa
## 5 5 3.6 1.4 0.2 setosa
## 6 5.4 3.9 1.7 0.4 setosa
## 7 4.6 3.4 1.4 0.3 setosa
## 8 5 3.4 1.5 0.2 setosa
## 9 4.4 2.9 1.4 0.2 setosa
## 10 4.9 3.1 1.5 0.1 setosa
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 8/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 12 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 7.1 3 5.9 2.1 virginica
## 2 7.6 3 6.6 2.1 virginica
## 3 7.3 2.9 6.3 1.8 virginica
## 4 7.2 3.6 6.1 2.5 virginica
## 5 7.7 3.8 6.7 2.2 virginica
## 6 7.7 2.6 6.9 2.3 virginica
## 7 7.7 2.8 6.7 2 virginica
## 8 7.2 3.2 6 1.8 virginica
## 9 7.2 3 5.8 1.6 virginica
## 10 7.4 2.8 6.1 1.9 virginica
## 11 7.9 3.8 6.4 2 virginica
## 12 7.7 3 6.1 2.3 virginica
#Multiple-column based criteria: Extract rows where Sepal.Length > 6.7 and Sepal.Width ≤ 3:
my_data %>% filter(Sepal.Length > 6.7, Sepal.Width <= 3)
## # A tibble: 10 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 6.8 2.8 4.8 1.4 versicolor
## 2 7.1 3 5.9 2.1 virginica
## 3 7.6 3 6.6 2.1 virginica
## 4 7.3 2.9 6.3 1.8 virginica
## 5 6.8 3 5.5 2.1 virginica
## 6 7.7 2.6 6.9 2.3 virginica
## 7 7.7 2.8 6.7 2 virginica
## 8 7.2 3 5.8 1.6 virginica
## 9 7.4 2.8 6.1 1.9 virginica
## 10 7.7 3 6.1 2.3 virginica
#Test for equality (==): Extract rows where Sepal.Length > 6.5 and Species = “versicolor”:
my_data %>% filter(Sepal.Length > 6.7, Species == "versicolor")
## # A tibble: 3 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 7 3.2 4.7 1.4 versicolor
## 2 6.9 3.1 4.9 1.5 versicolor
## 3 6.8 2.8 4.8 1.4 versicolor
#Using OR operator (|): Extract rows where Sepal.Length > 6.5 and (Species = “versicolor” orS
pecies = “virginica”):
#Use this:
my_data %>% filter(
Sepal.Length > 6.7,
Species == "versicolor" | Species == "virginica"
)
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 9/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 20 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 7 3.2 4.7 1.4 versicolor
## 2 6.9 3.1 4.9 1.5 versicolor
## 3 6.8 2.8 4.8 1.4 versicolor
## 4 7.1 3 5.9 2.1 virginica
## 5 7.6 3 6.6 2.1 virginica
## 6 7.3 2.9 6.3 1.8 virginica
## 7 7.2 3.6 6.1 2.5 virginica
## 8 6.8 3 5.5 2.1 virginica
## 9 7.7 3.8 6.7 2.2 virginica
## 10 7.7 2.6 6.9 2.3 virginica
## 11 6.9 3.2 5.7 2.3 virginica
## 12 7.7 2.8 6.7 2 virginica
## 13 7.2 3.2 6 1.8 virginica
## 14 7.2 3 5.8 1.6 virginica
## 15 7.4 2.8 6.1 1.9 virginica
## 16 7.9 3.8 6.4 2 virginica
## 17 7.7 3 6.1 2.3 virginica
## 18 6.9 3.1 5.4 2.1 virginica
## 19 6.9 3.1 5.1 2.3 virginica
## 20 6.8 3.2 5.9 2.3 virginica
## # A tibble: 20 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 7 3.2 4.7 1.4 versicolor
## 2 6.9 3.1 4.9 1.5 versicolor
## 3 6.8 2.8 4.8 1.4 versicolor
## 4 7.1 3 5.9 2.1 virginica
## 5 7.6 3 6.6 2.1 virginica
## 6 7.3 2.9 6.3 1.8 virginica
## 7 7.2 3.6 6.1 2.5 virginica
## 8 6.8 3 5.5 2.1 virginica
## 9 7.7 3.8 6.7 2.2 virginica
## 10 7.7 2.6 6.9 2.3 virginica
## 11 6.9 3.2 5.7 2.3 virginica
## 12 7.7 2.8 6.7 2 virginica
## 13 7.2 3.2 6 1.8 virginica
## 14 7.2 3 5.8 1.6 virginica
## 15 7.4 2.8 6.1 1.9 virginica
## 16 7.9 3.8 6.4 2 virginica
## 17 7.7 3 6.1 2.3 virginica
## 18 6.9 3.1 5.4 2.1 virginica
## 19 6.9 3.1 5.1 2.3 virginica
## 20 6.8 3.2 5.9 2.3 virginica
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 10/13
11/1/23, 11:33 PM cycle2.knit
#Create a new demo data set from my_data by removing the grouping column “Species”:
my_data2 <- my_data %>% select(-Species)
#Select rows where all variables are greater than 2.4:
my_data2 %>% filter_all(all_vars(.> 2.4))
## # A tibble: 3 × 4
## Sepal.Length Sepal.Width Petal.Length Petal.Width
## <dbl> <dbl> <dbl> <dbl>
## 1 6.3 3.3 6 2.5
## 2 7.2 3.6 6.1 2.5
## 3 6.7 3.3 5.7 2.5
#Select rows when any of the variables are greater than 2.4:
my_data2 %>% filter_all(any_vars(.> 2.4))
## # A tibble: 150 × 4
## Sepal.Length Sepal.Width Petal.Length Petal.Width
## <dbl> <dbl> <dbl> <dbl>
## 1 5.1 3.5 1.4 0.2
## 2 4.9 3 1.4 0.2
## 3 4.7 3.2 1.3 0.2
## 4 4.6 3.1 1.5 0.2
## 5 5 3.6 1.4 0.2
## 6 5.4 3.9 1.7 0.4
## 7 4.6 3.4 1.4 0.3
## 8 5 3.4 1.5 0.2
## 9 4.4 2.9 1.4 0.2
## 10 4.9 3.1 1.5 0.1
## # ℹ 140 more rows
## # A tibble: 150 × 4
## Sepal.Length Sepal.Width Petal.Length Petal.Width
## <dbl> <dbl> <dbl> <dbl>
## 1 5.1 3.5 1.4 0.2
## 2 4.9 3 1.4 0.2
## 3 4.7 3.2 1.3 0.2
## 4 4.6 3.1 1.5 0.2
## 5 5 3.6 1.4 0.2
## 6 5.4 3.9 1.7 0.4
## 7 4.6 3.4 1.4 0.3
## 8 5 3.4 1.5 0.2
## 9 4.4 2.9 1.4 0.2
## 10 4.9 3.1 1.5 0.1
## # ℹ 140 more rows
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 11/13
11/1/23, 11:33 PM cycle2.knit
# Print
friends_data
## # A tibble: 4 × 4
## name age height married
## <chr> <dbl> <dbl> <chr>
## 1 A 27 180 yes
## 2 B 25 NA yes
## 3 C 29 NA no
## 4 D 26 169 no
## # A tibble: 2 × 4
## name age height married
## <chr> <dbl> <dbl> <chr>
## 1 B 25 NA yes
## 2 C 29 NA no
## # A tibble: 2 × 4
## name age height married
## <chr> <dbl> <dbl> <chr>
## 1 A 27 180 yes
## 2 D 26 169 no
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 12/13
11/1/23, 11:33 PM cycle2.knit
## # A tibble: 5 × 5
## Sepal.Length Sepal.Width Petal.Length Petal.Width Species
## <dbl> <dbl> <dbl> <dbl> <fct>
## 1 7.7 3.8 6.7 2.2 virginica
## 2 7.7 2.6 6.9 2.3 virginica
## 3 7.7 2.8 6.7 2 virginica
## 4 7.9 3.8 6.4 2 virginica
## 5 7.7 3 6.1 2.3 virginica
file:///C:/Users/raghu/OneDrive/Desktop/cycle2.html 13/13