0% found this document useful (0 votes)

2 views17 pages

File 2

The document contains a series of R programming tasks including data analysis using built-in datasets, implementing various algorithms such as Linear Regression, Support Vector Machine, Decision Trees, Naive Bayes, K-Nearest Neighbors, and K-Means Clustering. It also includes tasks for creating patterns with asterisks and calculating factorials. Each task is presented with code snippets demonstrating the implementation of the respective functionality.

Uploaded by

harshilsonibusiness

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

2 views17 pages

File 2

Uploaded by

harshilsonibusiness

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 17

17) Write an R program to print, get information, print variable values, sort variable values and analyse data for the inbuilt dataset.

# Task 17: explore the built-in PlantGrowth dataset - print it, inspect its
# structure, list and sort its variables, then compute simple statistics.

# Load the built-in dataset
data("PlantGrowth")

# 1. Print the dataset
print("Dataset - PlantGrowth:")
print(PlantGrowth)

# 2. Get basic information about the dataset
print("Structure of the dataset:")
str(PlantGrowth)

print("Summary of the dataset:")
# Print explicitly: a bare summary() call is only shown by top-level
# autoprinting and displays nothing when the script is run via source().
print(summary(PlantGrowth))

# 3. Print variable values
print("Values of 'weight' variable:")
print(PlantGrowth$weight)

print("Values of 'group' variable:")
print(PlantGrowth$group)

# 4. Sort the 'weight' variable in ascending order
print("Sorted weights (ascending):")
print(sort(PlantGrowth$weight))

# order() gives the row permutation, so whole rows move with their weight.
sorted_df <- PlantGrowth[order(PlantGrowth$weight), ]

print("Data frame sorted by weight:")
print(sorted_df)

# 5. Analyze the data
mean_weight <- mean(PlantGrowth$weight)
cat("Mean of weights:", mean_weight, "\n")

sd_weight <- sd(PlantGrowth$weight)
cat("Standard deviation of weights:", sd_weight, "\n")

# One box per level of `group`.
boxplot(weight ~ group,
  data = PlantGrowth,
  main = "Weight by Treatment Group",
  xlab = "Group", ylab = "Weight",
  col = c("lightblue", "lightgreen", "lightcoral")
)

# Number of observations recorded for each group.
group_counts <- table(PlantGrowth$group)

print("Count of samples in each group:")
print(group_counts)
21) Write an R Program to find Factorial of a number.

# Task 21: read a number from the user and print its factorial.

# Return n! for a non-negative whole number n.
# seq_len(0) is empty and prod() of an empty vector is 1, so 0! is 1.
# (The earlier `for (i in 1:num)` iterated over c(1, 0) when num was 0 and
# therefore reported 0.)
compute_factorial <- function(n) {
  prod(seq_len(n))
}

# The coercion warning is suppressed because invalid input is reported
# explicitly below.
num <- suppressWarnings(as.numeric(readline("Enter a number: ")))

# NOTE: this variable keeps its original name; it masks base::factorial only
# as a variable, function calls to factorial() still resolve to base R.
factorial <- 1
if (!is.finite(num) || num != floor(num)) {
  # Empty, non-numeric, infinite or fractional input: `if (NA >= 0)` would
  # otherwise stop the script with an error.
  cat("Please enter a whole number.\n")
} else if (num >= 0) {
  factorial <- compute_factorial(num)
  cat("Factorial of", num, "is:", factorial, "\n")
} else {
  cat("Factorial is not defined for negative numbers.\n")
}

22) Write an R Program to print the following pattern

*     *
**   **
*** ***
*******

# Task 22: print two mirrored star triangles that close into one solid
# bottom row (7 stars wide for rows = 4, as in the task statement).
rows <- 4
width <- 2 * rows - 1 # the bottom row is a single unbroken run of stars

# Build each row as one string: i stars, a gap, i stars.
pattern_22 <- vapply(seq_len(rows), function(i) {
  gap <- width - 2 * i
  if (gap <= 0) {
    # The two triangles meet: emit one solid row instead of two halves.
    strrep("*", width)
  } else {
    paste0(strrep("*", i), strrep(" ", gap), strrep("*", i))
  }
}, character(1))

# writeLines() ends every row with a newline.
writeLines(pattern_22)

23) Write an R Program to print the following pattern

   *
  **
 ***
****
# Task 23: right-aligned triangle of stars, one more star on every row.
rows <- 4
for (stars in seq_len(rows)) {
  # Left-pad with blanks so that every row ends in the same column.
  cat(strrep(" ", rows - stars), strrep("*", stars), "\n", sep = "")
}
24) Write an R Program to print the following pattern
*
**
***
****
# Task 24: centred pyramid; row i holds i stars, each followed by a space.
rows <- 4

# (rows - i) leading blanks centre row i under the widest (last) row.
pattern_24 <- vapply(seq_len(rows), function(i) {
  paste0(strrep(" ", rows - i), strrep("* ", i))
}, character(1))

# One row per line; replaces the cat("\n") call that had been split across
# lines and fused onto the previous statement (a syntax error).
writeLines(pattern_24)

25) Write an R Program to print the following pattern

  *
 ***
*****
 ***
  *
# Task 25: print a solid diamond whose rows hold 1, 3, 5, 3, 1 stars
# (for rows = 3), matching the pattern given in the task statement.
rows <- 3

# Row indices going up to the widest row and back down again.
# rev(seq_len(rows - 1)) is empty for rows = 1, whereas `(rows - 1):1`
# would have counted 0, 1 and printed stray rows.
row_index <- c(seq_len(rows), rev(seq_len(rows - 1)))

# Row i carries 2 * i - 1 stars, preceded by (rows - i) blanks for centring.
pattern_25 <- vapply(row_index, function(i) {
  paste0(strrep(" ", rows - i), strrep("*", 2 * i - 1))
}, character(1))

writeLines(pattern_25)

26) Write an R Program to process the dataset by using its functions.

library(dplyr)
# Task 26: inspect and summarise the iris dataset with dplyr, then plot it.
data <- iris

# Explicit print() so the preview and the missing-value count are also shown
# when the script is run through source(), not only at the console.
print(head(data))
print(sum(is.na(data)))

# Overall mean / max / min of Sepal.Length (one-row result).
summary_data <- data %>%
  summarise(
    mean_Sepal.Length = mean(Sepal.Length, na.rm = TRUE),
    max_Sepal.Length = max(Sepal.Length, na.rm = TRUE),
    min_Sepal.Length = min(Sepal.Length, na.rm = TRUE)
  )

# Mean Sepal.Length per species (one row per level of Species).
species_summary <- data %>%
  group_by(Species) %>%
  summarise(mean_Sepal.Length = mean(Sepal.Length, na.rm = TRUE))

print(summary_data)
print(species_summary)

# Scatter plot coloured by species. The title is a single-line string again;
# it had been wrapped mid-literal, which embedded a newline in the title.
plot(data$Sepal.Length, data$Sepal.Width,
  main = "Sepal Length vs Sepal Width",
  xlab = "Sepal Length", ylab = "Sepal Width",
  col = data$Species, pch = 19
)
27) Write an R Program to implement Linear Regression Algorithm.

library(ggplot2)
library(readr)
library(caret)

# Task 27: fit a simple linear regression of Glucose on BMI and plot the fit.
# Expects "preprocessed_diabetes_dataset.csv" in the working directory with
# columns named Glucose and BMI (both are referenced below).
dataset <- read_csv("preprocessed_diabetes_dataset.csv")

# Explicit print() so output also appears when run via source().
print(head(dataset))

model <- lm(Glucose ~ BMI, data = dataset)

print(summary(model))

# Fitted Glucose value for every row, used to draw the regression line.
dataset$Predicted_Glucose <- predict(model, newdata = dataset)

# The two layer comments had been wrapped onto their own lines, which left
# bare words inside the `+` chain and made the script unparseable.
# NOTE(review): newer ggplot2 releases prefer `linewidth` over `size` for
# lines - confirm the installed version before switching.
plot <- ggplot(dataset, aes(x = BMI, y = Glucose)) +
  # Scatter plot of actual values
  geom_point(color = "blue", alpha = 0.5) +
  # Regression line
  geom_line(aes(y = Predicted_Glucose), color = "red", size = 1) +
  labs(
    title = "Linear Regression: Glucose vs BMI",
    x = "BMI",
    y = "Glucose"
  ) +
  theme_minimal()

print(plot)
28) Write an R program to implement a Support Vector Machine Algorithm.

# Task 28: train a linear-kernel SVM on iris and report test-set accuracy.

# Install e1071 on demand, then attach it with library() so that a failed
# load stops the script (require() would only return FALSE).
if (!requireNamespace("e1071", quietly = TRUE)) {
  install.packages("e1071")
}
library(e1071)

data(iris)
set.seed(123)

# 70/30 train/test split. seq_len() is safe for zero rows and floor() makes
# the truncation of the fractional sample size explicit.
n_obs <- nrow(iris)
sample_index <- sample(seq_len(n_obs), floor(0.7 * n_obs))

train_data <- iris[sample_index, ]
test_data <- iris[-sample_index, ]

# Species is modelled from all remaining columns.
svm_model <- svm(Species ~ ., data = train_data, kernel = "linear")

predictions <- predict(svm_model, test_data)

# Rows = predicted class, columns = actual class.
conf_matrix <- table(Predicted = predictions, Actual = test_data$Species)

print(conf_matrix)
# Diagonal cells are the correctly classified observations.
accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)
cat("Accuracy:", round(accuracy * 100, 2), "%\n")
29) Write an R program to implement a Decision Tree Algorithm.

# Task 29: classification tree (rpart) predicting Outcome on a diabetes CSV.

# Load necessary libraries: install on demand, then attach with library()
# so a failed load stops the script instead of silently returning FALSE.
for (pkg in c("rpart", "rpart.plot")) {
  if (!requireNamespace(pkg, quietly = TRUE)) {
    install.packages(pkg)
  }
}
library(rpart)
library(rpart.plot)

# Load dataset
# Expects "diabetes_data.csv" in the working directory with an `Outcome`
# column (the response used in the model formula below).
diabetes <- read.csv("diabetes_data.csv")

# Set seed
set.seed(123)

# Split data into training (70%) and testing (30%)
n_obs <- nrow(diabetes)
sample_index <- sample(seq_len(n_obs), floor(0.7 * n_obs))
train_data <- diabetes[sample_index, ]
test_data <- diabetes[-sample_index, ]

# Build decision tree model (Outcome against every other column)
tree_model <- rpart(Outcome ~ ., data = train_data, method = "class")

# Plot the tree
rpart.plot(tree_model, main = "Decision Tree for Diabetes Prediction")

# Make predictions
predictions <- predict(tree_model, test_data, type = "class")

# Confusion matrix (rows = predicted, columns = actual)
conf_matrix <- table(Predicted = predictions, Actual = test_data$Outcome)
print(conf_matrix)

# Accuracy: share of observations on the diagonal.
# NOTE(review): assumes every class appears in both margins so the table is
# square - confirm for small test sets.
accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)
cat("Accuracy:", round(accuracy * 100, 2), "%\n")
30) Write an R program to implement a Naive Bayes Algorithm.
# Task 30: naive Bayes classifier predicting `am` on mtcars.

# Install e1071 on demand, then attach it with library() so a failed load
# stops the script (require() would only return FALSE).
if (!requireNamespace("e1071", quietly = TRUE)) {
  install.packages("e1071")
}
library(e1071)

data(mtcars)
# The response must be a factor for classification.
mtcars$am <- as.factor(mtcars$am)
set.seed(123)

# 70/30 split; 0.7 * nrow(mtcars) is fractional, so floor() states the
# truncation that sample() previously applied implicitly.
n_obs <- nrow(mtcars)
sample_index <- sample(seq_len(n_obs), floor(0.7 * n_obs))

train_data <- mtcars[sample_index, ]
test_data <- mtcars[-sample_index, ]

# `am` is modelled from all remaining columns.
nb_model <- naiveBayes(am ~ ., data = train_data)

predictions <- predict(nb_model, test_data)

# Rows = predicted class, columns = actual class.
conf_matrix <- table(Predicted = predictions, Actual = test_data$am)

print(conf_matrix)

# Diagonal cells are the correctly classified observations.
accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)

cat("Accuracy:", round(accuracy * 100, 2), "%\n")
31) Write an R program to implement a K-Nearest Neighbour Algorithm.

# Task 31: k-nearest-neighbour classification of red-wine quality.

# Install and load required libraries; library() stops the script if the
# package still cannot be loaded, whereas require() only returns FALSE.
if (!requireNamespace("class", quietly = TRUE)) {
  install.packages("class")
}
library(class)

# Load the dataset
# Expects "redwinequality.csv" in the working directory with a `quality`
# column.
wine_data <- read.csv("redwinequality.csv")

# View the first few rows of the dataset
print(head(wine_data))

# Convert 'quality' to a factor (since it's the target variable)
wine_data$quality <- as.factor(wine_data$quality)

# Set seed for reproducibility
set.seed(123)

# Split the dataset into training (70%) and testing (30%) sets
n_obs <- nrow(wine_data)
sample_index <- sample(seq_len(n_obs), floor(0.7 * n_obs))
train_data <- wine_data[sample_index, ]
test_data <- wine_data[-sample_index, ]

# Separate features and target variable for both train and test sets.
# Features are picked by name, so the split stays correct even when
# 'quality' is not the last column of the CSV.
feature_cols <- setdiff(names(wine_data), "quality")
train_x <- train_data[, feature_cols, drop = FALSE] # All columns except 'quality'
train_y <- train_data$quality # Target variable (quality)
test_x <- test_data[, feature_cols, drop = FALSE] # All columns except 'quality'
test_y <- test_data$quality # Target variable (quality)

# Train the KNN model (k = 3)
# NOTE(review): the features are passed unscaled, so columns with large
# numeric ranges may dominate the distance - consider standardising.
k_value <- 3
knn_predictions <- knn(train_x, test_x, train_y, k = k_value)

# Confusion matrix (rows = predicted, columns = actual)
conf_matrix <- table(Predicted = knn_predictions, Actual = test_y)
print(conf_matrix)

# Calculate accuracy: share of observations on the diagonal
accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)
cat("Accuracy:", round(accuracy * 100, 2), "%\n")
32) Write an R program to implement a K-Means Clustering Algorithm.

# Task 32: k-means clustering (k = 3) of USArrests, shown on the first two
# principal components.
data("USArrests")
# Explicit print() so the preview also appears when run via source().
print(head(USArrests))
USArrests <- na.omit(USArrests)

# Centre and scale every column before clustering.
scaled_data <- scale(USArrests)

set.seed(123)

# nstart = 25 tries 25 random initialisations.
kmeans_result <- kmeans(scaled_data, centers = 3, nstart = 25)

print(kmeans_result)

# Attach the cluster label to each row as a factor.
USArrests$Cluster <- as.factor(kmeans_result$cluster)

# Install ggplot2 on demand, then attach it with library() so a failed load
# stops the script (require() would only return FALSE).
if (!requireNamespace("ggplot2", quietly = TRUE)) {
  install.packages("ggplot2")
}
library(ggplot2)

# PCA on the scaled data (computed before Cluster was added), keeping PC1
# and PC2 for plotting.
pca_result <- prcomp(scaled_data)

pca_data <- data.frame(pca_result$x[, 1:2], Cluster = USArrests$Cluster)

# print() so the plot is drawn under source() too. The x-axis label is a
# single-line string again; it had been wrapped mid-literal, which embedded
# a newline in the label.
print(
  ggplot(pca_data, aes(x = PC1, y = PC2, color = Cluster)) +
    geom_point(size = 3) +
    labs(
      title = "K-means Clustering on USArrests Dataset",
      x = "Principal Component 1",
      y = "Principal Component 2"
    ) +
    theme_minimal()
)

Mirrored Morality - Moral Choices in Videogames (Weaver & Lewis, 2012) - VG Researcher
No ratings yet
Mirrored Morality - Moral Choices in Videogames (Weaver & Lewis, 2012) - VG Researcher
7 pages
Rbi Grade B Depr Analysis and Pyqs
No ratings yet
Rbi Grade B Depr Analysis and Pyqs
17 pages
File 2
No ratings yet
File 2
17 pages
M Bda
No ratings yet
M Bda
19 pages
R Program 2025,-1
No ratings yet
R Program 2025,-1
11 pages
WEEK
No ratings yet
WEEK
17 pages
R Lab Program
No ratings yet
R Lab Program
20 pages
BDA Lab Manual (12 Weeks)
No ratings yet
BDA Lab Manual (12 Weeks)
22 pages
Data_scinece_practical_file
No ratings yet
Data_scinece_practical_file
23 pages
MY R
No ratings yet
MY R
11 pages
DATAMINING
No ratings yet
DATAMINING
24 pages
bd
No ratings yet
bd
12 pages
shahun term workR1
No ratings yet
shahun term workR1
34 pages
R_language Lab Manual_pg 2024
No ratings yet
R_language Lab Manual_pg 2024
29 pages
R- language
No ratings yet
R- language
23 pages
Toc ch1
No ratings yet
Toc ch1
9 pages
r file code
No ratings yet
r file code
16 pages
R lab Manual
No ratings yet
R lab Manual
22 pages
R Lab Manual (1)_merged
No ratings yet
R Lab Manual (1)_merged
25 pages
R Programs
No ratings yet
R Programs
12 pages
DA all (1)
No ratings yet
DA all (1)
15 pages
Datamining Lab Record
No ratings yet
Datamining Lab Record
36 pages
Dav Pracs
No ratings yet
Dav Pracs
9 pages
R Lab File Deepak
No ratings yet
R Lab File Deepak
27 pages
Lab file AD pdf
No ratings yet
Lab file AD pdf
25 pages
DM lab
No ratings yet
DM lab
18 pages
A Short List of Some Useful R Commands: Input and Display
No ratings yet
A Short List of Some Useful R Commands: Input and Display
2 pages
r program
No ratings yet
r program
22 pages
Data Science Lab Manual (R-Lab) Mca III Semester
No ratings yet
Data Science Lab Manual (R-Lab) Mca III Semester
2 pages
to edit data science
No ratings yet
to edit data science
18 pages
Final Data Lab
No ratings yet
Final Data Lab
21 pages
R Programming Practical File
No ratings yet
R Programming Practical File
38 pages
Data Sci Practical
No ratings yet
Data Sci Practical
8 pages
Workshop Activity: X Seq y Length
No ratings yet
Workshop Activity: X Seq y Length
3 pages
Session Set Working Directory Choose Directlry
No ratings yet
Session Set Working Directory Choose Directlry
17 pages
lab_taskR
No ratings yet
lab_taskR
6 pages
CS605 DA
No ratings yet
CS605 DA
21 pages
R16
No ratings yet
R16
55 pages
R Examples
No ratings yet
R Examples
56 pages
Big Data Slip Solution
No ratings yet
Big Data Slip Solution
18 pages
1
No ratings yet
1
19 pages
DA_Lab_Week-1
No ratings yet
DA_Lab_Week-1
7 pages
Wise CLZ R Programming 2022 Cse 2 2 Sem R20
No ratings yet
Wise CLZ R Programming 2022 Cse 2 2 Sem R20
49 pages
BAN5
No ratings yet
BAN5
2 pages
Datamining 2
No ratings yet
Datamining 2
54 pages
R Programming Lab
No ratings yet
R Programming Lab
14 pages
R Course
No ratings yet
R Course
7 pages
da thoery
No ratings yet
da thoery
24 pages
Final Cost Practical
No ratings yet
Final Cost Practical
29 pages
DM Slip Solutions
100% (1)
DM Slip Solutions
24 pages
Iba Cia 3
No ratings yet
Iba Cia 3
9 pages
datamining
No ratings yet
datamining
20 pages
Aman DA 111
No ratings yet
Aman DA 111
14 pages
7406HW02-1
No ratings yet
7406HW02-1
3 pages
7f18e5b8-c197-4086-98da-243347927150
No ratings yet
7f18e5b8-c197-4086-98da-243347927150
3 pages
IBS Sample I
No ratings yet
IBS Sample I
10 pages
Worksheet Classification2
No ratings yet
Worksheet Classification2
14 pages
Introduction To R For Gene Expression Data Analysis
No ratings yet
Introduction To R For Gene Expression Data Analysis
11 pages
R Manual
No ratings yet
R Manual
10 pages
R Programmimg Practical Journal All-1
No ratings yet
R Programmimg Practical Journal All-1
25 pages
Lisp Programming Language
From Everand
Lisp Programming Language
Faiz ul haque Zeya
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet
2023 Does Information Asymmetry
No ratings yet
2023 Does Information Asymmetry
27 pages
Spss Assignment 2
No ratings yet
Spss Assignment 2
2 pages
Outreg2(1)
No ratings yet
Outreg2(1)
34 pages
Yaregal Birhanu
No ratings yet
Yaregal Birhanu
8 pages
ARMA and ARIMA TJ Academy
No ratings yet
ARMA and ARIMA TJ Academy
6 pages
Mkt3mre Spss Workshops
No ratings yet
Mkt3mre Spss Workshops
111 pages
أثر عمليات اعادة التأمين على الأداء المالي لشركات التأمينات العامة المصرية ؛ دراسة كمية - محمد السيد حافظ ؛ مجلة الدراسات المالية والتجارية (تجارة بني سويف) ، ، مج29 ، ع2 ، 2019
No ratings yet
أثر عمليات اعادة التأمين على الأداء المالي لشركات التأمينات العامة المصرية ؛ دراسة كمية - محمد السيد حافظ ؛ مجلة الدراسات المالية والتجارية (تجارة بني سويف) ، ، مج29 ، ع2 ، 2019
42 pages
Using SPSS for Windows and Macintosh 8th Edition (eBook PDF) pdf download
100% (3)
Using SPSS for Windows and Macintosh 8th Edition (eBook PDF) pdf download
52 pages
Chapter 5.3-Mulitple Linear Regression
No ratings yet
Chapter 5.3-Mulitple Linear Regression
26 pages
Event History Analysis with Stata 2nd Edition Hans-Peter Blossfeld pdf download
No ratings yet
Event History Analysis with Stata 2nd Edition Hans-Peter Blossfeld pdf download
57 pages
Further Maths A Level 9231
100% (2)
Further Maths A Level 9231
30 pages
Aircraft Gas Turbine Engine Health Monitoring Syst
No ratings yet
Aircraft Gas Turbine Engine Health Monitoring Syst
13 pages
Identify and Explain The Different Plans of Work As Used in Library Classification
No ratings yet
Identify and Explain The Different Plans of Work As Used in Library Classification
7 pages
BIA Data Science Detailed Brochure - Vikhroli West, Mumbai-1
No ratings yet
BIA Data Science Detailed Brochure - Vikhroli West, Mumbai-1
28 pages
Occupational Schools Regular Schools
No ratings yet
Occupational Schools Regular Schools
31 pages
Chem-7 Domestic v2012.01.02 Operator Manual
No ratings yet
Chem-7 Domestic v2012.01.02 Operator Manual
101 pages
Role of Financial System in Economic Development
No ratings yet
Role of Financial System in Economic Development
22 pages
Predicting Student Stress Levels Based on Daily RESEARCH PAPER Li(1)
No ratings yet
Predicting Student Stress Levels Based on Daily RESEARCH PAPER Li(1)
15 pages
Big Data Chapter 2
No ratings yet
Big Data Chapter 2
62 pages
Entry Mode Strategies and Performance of Japanese Mncs in Australia and New Zealand: The Role of Japanese Employees
No ratings yet
Entry Mode Strategies and Performance of Japanese Mncs in Australia and New Zealand: The Role of Japanese Employees
19 pages
Instant Download (eBook PDF) Business Statistics, Global Edition 4h Edition PDF All Chapters
100% (2)
Instant Download (eBook PDF) Business Statistics, Global Edition 4h Edition PDF All Chapters
41 pages
Foundation Program 2021-22 Case Study and Report Generation CASE - 1 (Extra) Hindustan Housing Company
No ratings yet
Foundation Program 2021-22 Case Study and Report Generation CASE - 1 (Extra) Hindustan Housing Company
5 pages
Arun Kumar
No ratings yet
Arun Kumar
7 pages
Lay-Off Analysis & Prediction System-1
No ratings yet
Lay-Off Analysis & Prediction System-1
9 pages
On Features of Fugue Subjects A Comparison of J S Bach and Later Composers
100% (1)
On Features of Fugue Subjects A Comparison of J S Bach and Later Composers
21 pages
Homoscedasticity, Heteroscedasticity and Multicollinearity
100% (1)
Homoscedasticity, Heteroscedasticity and Multicollinearity
10 pages
Trip Generation Manual 10 th Edition Institute Of Transportation Engineers all chapter instant download
50% (2)
Trip Generation Manual 10 th Edition Institute Of Transportation Engineers all chapter instant download
65 pages
The Prevalence and Correlates of Postcoital Dysphoria in Women PDF
No ratings yet
The Prevalence and Correlates of Postcoital Dysphoria in Women PDF
13 pages

File 2

Uploaded by

File 2

Uploaded by

17) Write an R program to print, get information, print variable values,

# Load the built-in dataset

# 1. Print the dataset

# 2. Get basic information about the dataset

print("Summary of the dataset:")

# 3. Print variable values

print("Values of 'group' variable:")

# 4. Sort the 'weight' variable in ascending order

sorted_df <- PlantGrowth[order(PlantGrowth$weight), ]

# 5. Analyze the data

sd_weight <- sd(PlantGrowth$weight)

boxplot(weight ~ group, data = PlantGrowth,

group_counts <- table(PlantGrowth$group)

num <- as.numeric(readline("Enter a number: "))

22) Write an R Program to print the following pattern

spaces <- 2 * (rows - i)

23) Write an R Program to print the following pattern

cat(rep("*", i), sep = "")

cat(rep("* ", i), sep = "") cat("\

25) Write an R Program to print the following pattern

cat(rep("* ", i), sep = "")

for (i in (rows - 1):1)

26) Write an R Program to process the dataset by using its functions.

summary_data <- data %>%

species_summary <- data %>%

dataset <- read_csv("preprocessed_diabetes_dataset.csv")

model <- lm(Glucose ~ BMI, data = dataset)

dataset$Predicted_Glucose <- predict(model, newdata = dataset)

plot <- ggplot(dataset, aes(x = BMI, y = Glucose)) +

geom_line(aes(y = Predicted_Glucose), color = "red", size = 1) + #

labs(title = "Linear Regression: Glucose vs BMI",

sample_index <- sample(1:nrow(iris), 0.7 * nrow(iris))

svm_model <- svm(Species ~ ., data = train_data, kernel = "linear")

conf_matrix <- table(Predicted = predictions, Actual = test_data$Species)

# Load necessary libraries

# Split data into training (70%) and testing (30%)

# Build decision tree model

# Plot the tree

sample_index <- sample(1:nrow(mtcars), 0.7 * nrow(mtcars))

nb_model <- naiveBayes(am ~ ., data = train_data)

conf_matrix <- table(Predicted = predictions, Actual = test_data$am)

accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)

# Install and load required libraries

# Load the dataset

# View the first few rows of the dataset

# Convert 'quality' to a factor (since it's the target variable)

# Set seed for reproducibility

# Train the KNN model (k = 3)

scaled_data <- scale(USArrests)

kmeans_result <- kmeans(scaled_data, centers = 3, nstart = 25)

USArrests$Cluster <- as.factor(kmeans_result$cluster)

pca_result <- prcomp(scaled_data)

pca_data <- data.frame(pca_result$x[, 1:2], Cluster = USArrests$Cluster)

ggplot(pca_data, aes(x = PC1, y = PC2, color = Cluster)) +

You might also like