0% found this document useful (0 votes)

9 views17 pages

File 2

The document contains a series of R programming tasks including data analysis using built-in datasets, implementing various algorithms such as Linear Regression, Support Vector Machine, Decision Trees, Naive Bayes, K-Nearest Neighbors, and K-Means Clustering. It also includes tasks for creating patterns with asterisks and calculating factorials. Each task is presented with code snippets demonstrating the implementation of the respective functionality.

Uploaded by

harshilsonibusiness

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

9 views17 pages

File 2

Uploaded by

harshilsonibusiness

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 17

17) Write an R program to print a built-in dataset, get information about it, print its variable values, sort its variable values, and analyse the data.

# Explore the built-in PlantGrowth dataset: print it, inspect its structure,
# list and sort its two variables, and compute simple descriptive statistics.

# Load the built-in dataset
data("PlantGrowth")

# 1. Print the dataset
print("Dataset - PlantGrowth:")
print(PlantGrowth)

# 2. Get basic information about the dataset
print("Structure of the dataset:")
str(PlantGrowth)

print("Summary of the dataset:")
# Explicit print(): a bare top-level expression is not auto-printed when the
# script is run through source(), which left the label above without output.
print(summary(PlantGrowth))

# 3. Print variable values
print("Values of 'weight' variable:")
print(PlantGrowth$weight)

print("Values of 'group' variable:")
print(PlantGrowth$group)

# 4. Sort the 'weight' variable in ascending order
print("Sorted weights (ascending):")
print(sort(PlantGrowth$weight))

# order() returns the row permutation, so whole rows move together
sorted_df <- PlantGrowth[order(PlantGrowth$weight), ]

print("Data frame sorted by weight:")
print(sorted_df)

# 5. Analyze the data
mean_weight <- mean(PlantGrowth$weight)
cat("Mean of weights:", mean_weight, "\n")

sd_weight <- sd(PlantGrowth$weight)
cat("Standard deviation of weights:", sd_weight, "\n")

# One box per level of `group`
boxplot(weight ~ group,
  data = PlantGrowth,
  main = "Weight by Treatment Group",
  xlab = "Group", ylab = "Weight",
  col = c("lightblue", "lightgreen", "lightcoral")
)

group_counts <- table(PlantGrowth$group)

print("Count of samples in each group:")
print(group_counts)
21) Write an R Program to find Factorial of a number.

# Compute n! for a non-negative whole number `n`.
# seq_len(0) is empty and prod() of an empty vector is 1, so 0! is 1.
# (The previous `1:num` loop counted 1, 0 for num = 0 and printed 0.)
compute_factorial <- function(n) {
  prod(seq_len(n))
}

# Non-numeric input becomes NA; the coercion warning is expected and the NA
# is reported to the user just below.
num <- suppressWarnings(as.numeric(readline("Enter a number: ")))

factorial <- 1
if (!is.finite(num) || num != floor(num)) {
  # Covers empty/non-numeric input (NA), Inf, and fractional values
  cat("Please enter a whole number.\n")
} else if (num >= 0) {
  factorial <- compute_factorial(num)
  cat("Factorial of", num, "is:", factorial, "\n")
} else {
  cat("Factorial is not defined for negative numbers.\n")
}

22) Write an R Program to print the following pattern

*     *
**   **
*** ***
*******

# Print two mirrored star wings that close into one solid row:
#   row i has i stars on each side; the last row is a single run of stars.
# The requested pattern ends in a 7-star row for 4 rows, so the figure is
# 2 * rows - 1 columns wide (the wings share the centre column).
rows <- 4
width <- 2 * rows - 1

star_count <- seq_len(rows)
wing <- strrep("*", star_count)
gap <- width - 2 * star_count # columns left between the two wings

pattern_lines <- ifelse(
  gap > 0,
  # pmax() keeps strrep() valid on the last row, where gap is negative and
  # this branch's value is discarded anyway
  paste0(wing, strrep(" ", pmax(gap, 0)), wing),
  strrep("*", width)
)

writeLines(pattern_lines)

23) Write an R Program to print the following pattern

*
**
***
****
# Print a right-aligned triangle: row i is (rows - i) spaces then i stars.
rows <- 4
for (i in 1:rows) {
  padding <- strrep(" ", rows - i)
  stars <- strrep("*", i)
  cat(padding, stars, "\n", sep = "")
}
24) Write an R Program to print the following pattern
*
**
***
****
# Print a centred pyramid: row i is (rows - i) spaces followed by i copies
# of "* " (each star carries a trailing space, as in the original calls).
# The original had two cat() calls fused on one line, which does not parse.
rows <- 4

star_count <- seq_len(rows)
pyramid_lines <- paste0(
  strrep(" ", rows - star_count),
  strrep("* ", star_count)
)

writeLines(pyramid_lines)

25) Write an R Program to print the following pattern

  *
 ***
*****
 ***
  *
# Print a diamond whose rows hold 1, 3, 5, ..., 2 * rows - 1 stars and then
# shrink back to 1. Row i is (rows - i) spaces followed by 2 * i - 1 stars.
# The previous code emitted i copies of "* " per row (1, 2, 3, 2, 1 stars),
# which does not match the requested 1, 3, 5, 3, 1 figure.
rows <- 3

# Widening half, then the narrowing half without repeating the middle row.
# seq_len() keeps the narrowing half empty when rows is 1, where
# `(rows - 1):1` would have counted 0, 1.
row_order <- c(seq_len(rows), rev(seq_len(max(rows - 1, 0))))

diamond_lines <- paste0(
  strrep(" ", rows - row_order),
  strrep("*", 2 * row_order - 1)
)

writeLines(diamond_lines)

26) Write an R Program to process the dataset by using its functions.

# Summarise the built-in iris data with dplyr and plot sepal length vs width.
library(dplyr)

data <- iris

# print() so the results also appear when the script is run via source()
print(head(data))
print(sum(is.na(data))) # total number of missing cells

# Overall mean / max / min of Sepal.Length (one-row result)
summary_data <- data %>%
  summarise(
    mean_Sepal.Length = mean(Sepal.Length, na.rm = TRUE),
    max_Sepal.Length = max(Sepal.Length, na.rm = TRUE),
    min_Sepal.Length = min(Sepal.Length, na.rm = TRUE)
  )

# Mean Sepal.Length per species (one row per level of Species)
species_summary <- data %>%
  group_by(Species) %>%
  summarise(mean_Sepal.Length = mean(Sepal.Length, na.rm = TRUE))

print(summary_data)
print(species_summary)

# The title is kept on one line: the wrapped string literal embedded a
# newline in the plot title.
plot(data$Sepal.Length, data$Sepal.Width,
  main = "Sepal Length vs Sepal Width",
  xlab = "Sepal Length", ylab = "Sepal Width",
  col = data$Species, pch = 19
)
27) Write an R Program to implement Linear Regression Algorithm.

# Fit a simple linear regression of Glucose on BMI and plot the fitted line
# over the observed points.
library(ggplot2)
library(readr)
library(caret)

# Expects the CSV in the working directory; the model below uses its
# `Glucose` and `BMI` columns.
dataset <- read_csv("preprocessed_diabetes_dataset.csv")

# print() so the output also appears when the script is run via source()
print(head(dataset))

model <- lm(Glucose ~ BMI, data = dataset)

print(summary(model))

# Fitted values for the same rows the model was trained on
dataset$Predicted_Glucose <- predict(model, newdata = dataset)

# Comments sit on their own lines: the wrapped trailing comments left the
# words `values` and `Regression line` as code and broke the `+` chain.
plot <- ggplot(dataset, aes(x = BMI, y = Glucose)) +
  # Scatter plot of actual values
  geom_point(color = "blue", alpha = 0.5) +
  # Regression line
  geom_line(aes(y = Predicted_Glucose), color = "red", size = 1) +
  labs(
    title = "Linear Regression: Glucose vs BMI",
    x = "BMI",
    y = "Glucose"
  ) +
  theme_minimal()

print(plot)
28) Write an R program to implement a Support Vector
Machine Algorithm.

# Train a linear-kernel SVM on a 70% sample of iris and report the
# confusion matrix and accuracy on the remaining rows.

# Load e1071 (provides svm()), installing it first when it is missing
if (!require(e1071)) {
  install.packages("e1071")
  library(e1071)
}

data(iris)
set.seed(123)

# Row numbers drawn for training; everything else is held out for testing
n_obs <- nrow(iris)
sample_index <- sample(1:n_obs, 0.7 * n_obs)

train_data <- iris[sample_index, ]
test_data <- iris[-sample_index, ]

# Species is modelled from all other columns
svm_model <- svm(Species ~ ., data = train_data, kernel = "linear")

predictions <- predict(svm_model, test_data)

# Rows are predicted classes, columns are the true classes
conf_matrix <- table(Predicted = predictions, Actual = test_data$Species)
print(conf_matrix)

# Correct predictions lie on the diagonal
n_correct <- sum(diag(conf_matrix))
n_total <- sum(conf_matrix)
accuracy <- n_correct / n_total
cat("Accuracy:", round(accuracy * 100, 2), "%\n")
29) Write an R program to implement a Decision Tree Algorithm.

# Fit a classification tree for `Outcome` on a 70% sample of the diabetes
# data, plot the tree, and report test-set confusion matrix and accuracy.

# Install rpart / rpart.plot when they are missing, then attach both
if (!require(rpart)) install.packages("rpart")
if (!require(rpart.plot)) install.packages("rpart.plot")
library(rpart)
library(rpart.plot)

# Expects the CSV in the working directory
diabetes <- read.csv("diabetes_data.csv")

# Fixed seed so the split below is reproducible
set.seed(123)

# 70% of the row numbers go to training; the rest are held out
n_obs <- nrow(diabetes)
sample_index <- sample(1:n_obs, 0.7 * n_obs)
train_data <- diabetes[sample_index, ]
test_data <- diabetes[-sample_index, ]

# Outcome is modelled from all other columns as a classification problem
tree_model <- rpart(Outcome ~ ., data = train_data, method = "class")

rpart.plot(tree_model, main = "Decision Tree for Diabetes Prediction")

# type = "class" returns predicted labels rather than class probabilities
predictions <- predict(tree_model, test_data, type = "class")

# Rows are predicted classes, columns are the true classes
conf_matrix <- table(Predicted = predictions, Actual = test_data$Outcome)
print(conf_matrix)

# Correct predictions lie on the diagonal
n_correct <- sum(diag(conf_matrix))
n_total <- sum(conf_matrix)
accuracy <- n_correct / n_total
cat("Accuracy:", round(accuracy * 100, 2), "%\n")
30) Write an R program to implement a Naive Bayes Algorithm.
# Train a Naive Bayes classifier for mtcars$am on a 70% sample and report
# the confusion matrix and accuracy on the remaining rows.

# Load e1071 (provides naiveBayes()), installing it first when it is missing
if (!require(e1071)) {
  install.packages("e1071")
  library(e1071)
}

data(mtcars)

# The target must be a factor for classification
mtcars$am <- as.factor(mtcars$am)
set.seed(123)

# Row numbers drawn for training; everything else is held out for testing
n_obs <- nrow(mtcars)
sample_index <- sample(1:n_obs, 0.7 * n_obs)

train_data <- mtcars[sample_index, ]
test_data <- mtcars[-sample_index, ]

# am is modelled from all other columns
nb_model <- naiveBayes(am ~ ., data = train_data)

predictions <- predict(nb_model, test_data)

# Rows are predicted classes, columns are the true classes
conf_matrix <- table(Predicted = predictions, Actual = test_data$am)
print(conf_matrix)

# Correct predictions lie on the diagonal
n_correct <- sum(diag(conf_matrix))
n_total <- sum(conf_matrix)
accuracy <- n_correct / n_total

cat("Accuracy:", round(accuracy * 100, 2), "%\n")
31) Write an R program to implement a K-Nearest
Neighbour Algorithm.

# Classify wine quality with k-nearest neighbours (k = 3) on a 70/30 split
# and report the test-set confusion matrix and accuracy.

# Install and load required libraries
if (!require(class)) {
  install.packages("class")
  library(class)
}

# Load the dataset (expects the CSV in the working directory)
wine_data <- read.csv("redwinequality.csv")

# View the first few rows of the dataset
# print() so the output also appears when the script is run via source()
print(head(wine_data))

# Convert 'quality' to a factor (since it's the target variable)
wine_data$quality <- as.factor(wine_data$quality)

# Set seed for reproducibility
set.seed(123)

# Split the dataset into training (70%) and testing (30%) sets
sample_index <- sample(seq_len(nrow(wine_data)), 0.7 * nrow(wine_data))
train_data <- wine_data[sample_index, ]
test_data <- wine_data[-sample_index, ]

# Separate features and target variable for both train and test sets.
# Dropping the last column assumes 'quality' is the final column of the CSV.
# (The wrapped comment here previously spilled onto the next line and fused
# with the test_y assignment, which did not parse.)
target_col <- ncol(wine_data)
train_x <- train_data[, -target_col] # All columns except 'quality'
train_y <- train_data$quality # Target variable (quality)
test_x <- test_data[, -target_col] # All columns except 'quality'
test_y <- test_data$quality # Target variable (quality)

# Train the KNN model (k = 3)
k_value <- 3
knn_predictions <- knn(train_x, test_x, train_y, k = k_value)

# Confusion matrix: rows are predicted classes, columns are true classes
conf_matrix <- table(Predicted = knn_predictions, Actual = test_y)
print(conf_matrix)

# Calculate accuracy (correct predictions lie on the diagonal)
accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)
cat("Accuracy:", round(accuracy * 100, 2), "%\n")
32) Write an R program to implement a K-Means
Clustering Algorithm.

# Cluster the built-in USArrests data into 3 groups with k-means and show
# the clusters on the first two principal components.
data("USArrests")

# print() so the output also appears when the script is run via source()
print(head(USArrests))
USArrests <- na.omit(USArrests)

# Standardise columns so no single variable dominates the distances
scaled_data <- scale(USArrests)

set.seed(123)

# nstart = 25 tries 25 random starts and keeps the best solution
kmeans_result <- kmeans(scaled_data, centers = 3, nstart = 25)

print(kmeans_result)

USArrests$Cluster <- as.factor(kmeans_result$cluster)

if (!require(ggplot2)) {
  install.packages("ggplot2")
  library(ggplot2)
}

# PCA on the scaled numeric data (computed before Cluster was added)
pca_result <- prcomp(scaled_data)

pca_data <- data.frame(pca_result$x[, 1:2], Cluster = USArrests$Cluster)

# Axis labels are kept on one line: the wrapped string literal embedded a
# newline in the x-axis label.
cluster_plot <- ggplot(pca_data, aes(x = PC1, y = PC2, color = Cluster)) +
  geom_point(size = 3) +
  labs(
    title = "K-means Clustering on USArrests Dataset",
    x = "Principal Component 1",
    y = "Principal Component 2"
  ) +
  theme_minimal()

# Explicit print() so the plot is drawn under source() as well
print(cluster_plot)

File 2
No ratings yet
File 2
17 pages
M Bda
No ratings yet
M Bda
19 pages
R Program 2025,-1
No ratings yet
R Program 2025,-1
11 pages
WEEK
No ratings yet
WEEK
17 pages
R Lab Program
No ratings yet
R Lab Program
20 pages
BDA Lab Manual (12 Weeks)
No ratings yet
BDA Lab Manual (12 Weeks)
22 pages
Data Scinece Practical File
No ratings yet
Data Scinece Practical File
23 pages
Write A R Program For Different Types of Data Structures
No ratings yet
Write A R Program For Different Types of Data Structures
11 pages
DATAMINING
No ratings yet
DATAMINING
24 pages
BD
No ratings yet
BD
12 pages
Shahun Term Workr1
No ratings yet
Shahun Term Workr1
34 pages
R - Language Lab Manual - PG 2024
No ratings yet
R - Language Lab Manual - PG 2024
29 pages
R - Language
No ratings yet
R - Language
23 pages
R Code Compact
No ratings yet
R Code Compact
10 pages
Toc ch1
No ratings yet
Toc ch1
9 pages
R File Code
No ratings yet
R File Code
16 pages
EXXAM
No ratings yet
EXXAM
3 pages
R Lab Manual
No ratings yet
R Lab Manual
22 pages
R Lab Manual (1) - Merged
No ratings yet
R Lab Manual (1) - Merged
25 pages
R Programs
No ratings yet
R Programs
12 pages
DA All
No ratings yet
DA All
15 pages
Datamining Lab Record
No ratings yet
Datamining Lab Record
36 pages
Dav Pracs
No ratings yet
Dav Pracs
9 pages
Rlab
No ratings yet
Rlab
7 pages
R Lab File Deepak
No ratings yet
R Lab File Deepak
27 pages
Lab File AD PDF
No ratings yet
Lab File AD PDF
25 pages
DM Lab
No ratings yet
DM Lab
18 pages
A Short List of Some Useful R Commands: Input and Display
No ratings yet
A Short List of Some Useful R Commands: Input and Display
2 pages
R Program
No ratings yet
R Program
22 pages
Data Science Lab Manual (R-Lab) Mca III Semester
No ratings yet
Data Science Lab Manual (R-Lab) Mca III Semester
2 pages
To Edit Data Science
No ratings yet
To Edit Data Science
18 pages
Final Data Lab
No ratings yet
Final Data Lab
21 pages
R Programming Exercises
No ratings yet
R Programming Exercises
38 pages
Data Sci Practical
No ratings yet
Data Sci Practical
8 pages
Workshop Activity: X Seq y Length
No ratings yet
Workshop Activity: X Seq y Length
3 pages
Session Set Working Directory Choose Directlry
No ratings yet
Session Set Working Directory Choose Directlry
17 pages
Lab Taskr
No ratings yet
Lab Taskr
6 pages
CS605 Da
No ratings yet
CS605 Da
21 pages
Certificate: Alard College of Business Studies
No ratings yet
Certificate: Alard College of Business Studies
55 pages
R Examples
No ratings yet
R Examples
56 pages
Big Data Slip Solution
No ratings yet
Big Data Slip Solution
18 pages
1
No ratings yet
1
19 pages
DA Lab Week-1
No ratings yet
DA Lab Week-1
7 pages
Wise CLZ R Programming 2022 Cse 2 2 Sem R20
No ratings yet
Wise CLZ R Programming 2022 Cse 2 2 Sem R20
49 pages
BAN5
No ratings yet
BAN5
2 pages
Datamining 2
No ratings yet
Datamining 2
54 pages
R Programming Lab
No ratings yet
R Programming Lab
14 pages
R Course
No ratings yet
R Course
7 pages
Da Thoery
No ratings yet
Da Thoery
24 pages
Final Cost Practical
No ratings yet
Final Cost Practical
29 pages
DM Slip Solutions
100% (1)
DM Slip Solutions
24 pages
Iba Cia 3
No ratings yet
Iba Cia 3
9 pages
Datamining
No ratings yet
Datamining
20 pages
Aman DA 111
No ratings yet
Aman DA 111
14 pages
7406HW02 1
No ratings yet
7406HW02 1
3 pages
7f18e5b8-c197-4086-98da-243347927150
No ratings yet
7f18e5b8-c197-4086-98da-243347927150
3 pages
IBS Sample I
No ratings yet
IBS Sample I
10 pages
Introduction To R For Gene Expression Data Analysis
No ratings yet
Introduction To R For Gene Expression Data Analysis
11 pages
Prob Stats Module 3
No ratings yet
Prob Stats Module 3
49 pages
Trần Mạnh Hùng 20192643.Ipynb - Colab
No ratings yet
Trần Mạnh Hùng 20192643.Ipynb - Colab
6 pages
Assignment 2
No ratings yet
Assignment 2
2 pages
Linear Regression with Excel Toolpak
No ratings yet
Linear Regression with Excel Toolpak
3 pages
Final Examination StatS - 20DAVID - 20JUDYANN - 20G - 20MAED MAPEH
No ratings yet
Final Examination StatS - 20DAVID - 20JUDYANN - 20G - 20MAED MAPEH
8 pages
DSF - UNIT III Notes
No ratings yet
DSF - UNIT III Notes
17 pages
MODULE 4-Dr - GM
No ratings yet
MODULE 4-Dr - GM
23 pages
Reading 2 Time Series Analysis
No ratings yet
Reading 2 Time Series Analysis
22 pages
Supervised Learning with Scikit-Learn
No ratings yet
Supervised Learning with Scikit-Learn
178 pages
Nonlinear Regression & Interaction Terms
No ratings yet
Nonlinear Regression & Interaction Terms
2 pages
Outliers and Influential Observations
No ratings yet
Outliers and Influential Observations
5 pages
Predicting The Term Deposit Subscription
No ratings yet
Predicting The Term Deposit Subscription
38 pages
Exanova
No ratings yet
Exanova
3 pages
Binary Logistic Regression Guide
No ratings yet
Binary Logistic Regression Guide
16 pages
Gatsonis 1989
No ratings yet
Gatsonis 1989
9 pages
Confusion Matrix
No ratings yet
Confusion Matrix
14 pages
Regression Analysis
No ratings yet
Regression Analysis
6 pages
Linear Regression & Correlation Guide
No ratings yet
Linear Regression & Correlation Guide
5 pages
Notes On Module 3 - Pattern Recognition
No ratings yet
Notes On Module 3 - Pattern Recognition
17 pages
Exp 15
No ratings yet
Exp 15
12 pages
T Test
No ratings yet
T Test
17 pages
MLP - Iv Eee
No ratings yet
MLP - Iv Eee
36 pages
Machine Learning Master Class: Warriors Way
No ratings yet
Machine Learning Master Class: Warriors Way
3 pages
PPP Models - ARIMA & NARNN - Ipynb - Colaboratory
No ratings yet
PPP Models - ARIMA & NARNN - Ipynb - Colaboratory
8 pages
Correlation Analysis in SPSS Guide
100% (1)
Correlation Analysis in SPSS Guide
2 pages
Usage of Color Measurements Obtained by Modified Seliwanoff Test To Determine Hydroxymethylfurfural
No ratings yet
Usage of Color Measurements Obtained by Modified Seliwanoff Test To Determine Hydroxymethylfurfural
8 pages
Regrassion Analysis Lab Question and Answer
No ratings yet
Regrassion Analysis Lab Question and Answer
13 pages
Answers:: Fin1131/Fin3154 First Semester, AY 2020-2021 Laboratory Activity 3
No ratings yet
Answers:: Fin1131/Fin3154 First Semester, AY 2020-2021 Laboratory Activity 3
4 pages
Autocorrelation
No ratings yet
Autocorrelation
4 pages
SPSS Binary Logistic Regression Demo 1 Terminate
100% (1)
SPSS Binary Logistic Regression Demo 1 Terminate
22 pages

File 2

Uploaded by

File 2

Uploaded by

17) Write an R program to print, get information, print variable values,

# Load the built-in dataset

# 1. Print the dataset

# 2. Get basic information about the dataset

print("Summary of the dataset:")

# 3. Print variable values

print("Values of 'group' variable:")

# 4. Sort the 'weight' variable in ascending order

sorted_df <- PlantGrowth[order(PlantGrowth$weight), ]

# 5. Analyze the data

sd_weight <- sd(PlantGrowth$weight)

boxplot(weight ~ group, data = PlantGrowth,

group_counts <- table(PlantGrowth$group)

num <- as.numeric(readline("Enter a number: "))

22) Write an R Program to print the following pattern

spaces <- 2 * (rows - i)

23) Write an R Program to print the following pattern

cat(rep("*", i), sep = "")

cat(rep("* ", i), sep = "") cat("\

25) Write an R Program to print the following pattern

cat(rep("* ", i), sep = "")

for (i in (rows - 1):1)

26) Write an R Program to process the dataset by using its functions.

summary_data <- data %>%

species_summary <- data %>%

dataset <- read_csv("preprocessed_diabetes_dataset.csv")

model <- lm(Glucose ~ BMI, data = dataset)

dataset$Predicted_Glucose <- predict(model, newdata = dataset)

plot <- ggplot(dataset, aes(x = BMI, y = Glucose)) +

geom_line(aes(y = Predicted_Glucose), color = "red", size = 1) + #

labs(title = "Linear Regression: Glucose vs BMI",

sample_index <- sample(1:nrow(iris), 0.7 * nrow(iris))

svm_model <- svm(Species ~ ., data = train_data, kernel = "linear")

conf_matrix <- table(Predicted = predictions, Actual = test_data$Species)

# Load necessary libraries

# Split data into training (70%) and testing (30%)

# Build decision tree model

# Plot the tree

sample_index <- sample(1:nrow(mtcars), 0.7 * nrow(mtcars))

nb_model <- naiveBayes(am ~ ., data = train_data)

conf_matrix <- table(Predicted = predictions, Actual = test_data$am)

accuracy <- sum(diag(conf_matrix)) / sum(conf_matrix)

# Install and load required libraries

# Load the dataset

# View the first few rows of the dataset

# Convert 'quality' to a factor (since it's the target variable)

# Set seed for reproducibility

# Train the KNN model (k = 3)

scaled_data <- scale(USArrests)

kmeans_result <- kmeans(scaled_data, centers = 3, nstart = 25)

USArrests$Cluster <- as.factor(kmeans_result$cluster)

pca_result <- prcomp(scaled_data)

pca_data <- data.frame(pca_result$x[, 1:2], Cluster = USArrests$Cluster)

ggplot(pca_data, aes(x = PC1, y = PC2, color = Cluster)) +

You might also like