Location via proxy:   [ UP ]  
[Report a bug]   [Manage cookies]                
0% found this document useful (0 votes)
20 views

Final Data Lab

Lab Manual

Uploaded by

pvarshinibca
Copyright
© © All Rights Reserved
Available Formats
Download as PDF, TXT or read online on Scribd
0% found this document useful (0 votes)
20 views

Final Data Lab

Lab Manual

Uploaded by

pvarshinibca
Copyright
© © All Rights Reserved
Available Formats
Download as PDF, TXT or read online on Scribd
You are on page 1/ 21

DATA SCIENCE & MACHINE LEARNING

P23CAP26 LABORATORY

EX . NO: 1 - R AS CALCULATOR APPLICATION.

PROGRAM:

# Return the sum of two numbers (vectorized, like `+` itself).
add <- function(x, y) {
  x + y
}

# Return the difference x - y.
subtract <- function(x, y) {
  x - y
}

# Return the product x * y.
multiply <- function(x, y) {
  x * y
}

# Return the quotient x / y. Division by zero yields Inf/-Inf/NaN,
# exactly as base R's `/` does.
divide <- function(x, y) {
  x / y
}
# Menu-driven calculator: read an operation and two numbers from the
# console, then print the formatted result.
print("Select operation.")
print("1.Add")
print("2.Subtract")
print("3.Multiply")
print("4.Divide")

# Use <- for assignment (not =) and validate the menu choice instead of
# letting an out-of-range value fall through switch() as a silent NULL.
choice <- as.integer(readline(prompt="Enter choice[1/2/3/4]: "))
if (is.na(choice) || choice < 1 || choice > 4) {
  stop("Invalid choice: please enter 1, 2, 3 or 4.", call. = FALSE)
}

# as.numeric (not as.integer) so decimal inputs such as 2.5 are not
# silently truncated.
num1 <- as.numeric(readline(prompt="Enter first number: "))
num2 <- as.numeric(readline(prompt="Enter second number: "))

# Map the validated choice to its display symbol and its operation.
operator <- switch(choice, "+", "-", "*", "/")
result <- switch(choice,
                 add(num1, num2),
                 subtract(num1, num2),
                 multiply(num1, num2),
                 divide(num1, num2))
print(paste(num1, operator, num2, "=", result))

OUTPUT
EX.NO: 2 – DESCRIPTIVE STATISTICS ON R.

#MEAN#

# Average a vector of daily ratings two ways: manually (sum / count),
# then with the built-in mean() to confirm both give the same value.
how_was_the_day <- c(2, 3, 4, 3, 5, 4, 2, 1, 3)

tot_day <- sum(how_was_the_day)     # total of all ratings
cnt_day <- length(how_was_the_day)  # number of observations

avg_for_day <- tot_day / cnt_day    # manual arithmetic mean
print(avg_for_day)

mean(how_was_the_day)               # built-in equivalent

#MEDIAN#

# Median of three sample vectors: two even-length cases (median is the
# mean of the two middle values) and one odd-length case.
a <- c(200, 400, 1000, 450, 234, 700)
median(a)  # (400 + 450) / 2 = 425

b <- c(7000, 4000, 2000, 1000, 5000, 5000)
median(b)  # (4000 + 5000) / 2 = 4500

# Renamed from `c`: binding a variable to the name of base::c() shadows
# a core function's name and is a classic source of confusion.
vals <- c(20, 30, 40, 50, 60)
median(vals)  # middle value = 40

#MODE#

# Statistical mode: the most frequent value in `v`.
# Ties resolve to whichever candidate appears first in unique(v).
getmode <- function(v) {
  distinct_vals <- unique(v)
  freq <- tabulate(match(v, distinct_vals))
  distinct_vals[which.max(freq)]
}

# All sale values are distinct, so the mode is the first element.
sale <- c(10, 45, 67, 30, 60, 34, 59, 90)
result <- getmode(sale)
print(result)

OUTPUT
EX . NO: 3 - READING AND WRITING DIFFERENT TYPES OF DATASETS

PROGRAM:
# Read and write CSV, Excel and tab-delimited files with the tidyverse
# I/O packages. Install each package only when it is missing, so the
# script does not hit the network (or fail offline) on every run.
for (pkg in c("readr", "readxl", "writexl", "haven")) {
  if (!requireNamespace(pkg, quietly = TRUE)) {
    install.packages(pkg)
  }
}

# Load the packages
library(readr)
library(readxl)
library(writexl)
library(haven)

# CSV Files: read, then round-trip to a new file.
df_csv <- read_csv("file.csv")
write_csv(df_csv, "output.csv")

# Excel Files (XLSX)
df_excel <- read_excel("file.xlsx")
write_xlsx(df_excel, "output.xlsx")

# Text Files (Tab-Delimited)
df_tsv <- read_tsv("file.tsv")
write_tsv(df_tsv, "output.tsv")
OUTPUT:
EX.NO: 4. VISUALIZATION.

PROGRAM:

# Four one-variable lattice plots of mpg from the mtcars dataset.
library(lattice)
library(datasets)

mtcars       # print the full data set
str(mtcars)  # structure of the data frame

# The original prefixed each plot with a bare numeric literal
# (e.g. `1.#HISTOGRAM#`), which evaluates and prints a stray `[1] 1`;
# the section numbers belong inside comments instead.

# 1. HISTOGRAM
histogram(~mpg, data = mtcars)
# 2. BOX PLOT
bwplot(~mpg, data = mtcars)
# 3. DENSITY PLOT
densityplot(~mpg, data = mtcars)
# 4. BAR GRAPH
barchart(~mpg, data = mtcars)
OUTPUT:

HISTOGRAM

BOXPLOT

DENSITY PLOT
BAR GRAPH
EX.NO:5 CORRELATION AND COVARIANCE

PROGRAM:
# Covariance and Pearson correlation of two small numeric vectors.
x <- c(2, 4, 6, 8, 10)
y <- c(1, 3, 2, 5, 7)

#COVARIANCE#
# Sign indicates whether x and y tend to move together.
cov_xy <- cov(x, y)
cat("Covariance between x and y:", cov_xy, "\n")

#CORRELATION#
# Covariance rescaled by the standard deviations, so it lies in [-1, 1].
cor_xy <- cor(x, y)
cat("Correlation between x and y:", cor_xy, "\n")

OUTPUT:
6.REGRESSION MODEL

# Simulate data from y = 3 + 2x + noise, fit a simple linear model,
# and draw the fitted line over the scatter of points.

set.seed(42)  # reproducible random draws

# Predictor and response; true intercept is 3, true slope is 2.
x <- rnorm(100, mean = 5, sd = 2)
y <- 3 + 2 * x + rnorm(100)

# Ordinary least squares fit of y on x.
model <- lm(y ~ x)

# Coefficient estimates, residual summary and R-squared.
print(summary(model))

# Scatter plot with the estimated regression line overlaid in blue.
plot(x, y, main = "Scatter Plot with Regression Line", xlab = "x", ylab = "y")
abline(model, col = "blue")

OUTPUT:
7.Multiple regression

# Multiple linear regression: model mpg as a function of horsepower,
# weight and cylinder count, then score two new car configurations.
# Base R is sufficient here -- the original installed and loaded the
# entire tidyverse only to build one small data frame with tibble();
# data.frame() produces identical predictions without the dependency.

data(mtcars)
head(mtcars)

# Fit mpg on hp, wt and cyl.
model <- lm(mpg ~ hp + wt + cyl, data = mtcars)
summary(model)

# Two hypothetical cars to score with the fitted model.
new_data <- data.frame(hp = c(150, 200), wt = c(2.5, 3.0), cyl = c(4, 6))
predictions <- predict(model, newdata = new_data)
print(predictions)

# Standard 2x2 panel of lm diagnostic plots.
par(mfrow = c(2, 2))
plot(model)

Output:
print(predictions)
1 2
24.36217 19.99355

Plot:
EX.NO: 8. Regression model for prediction
# Fit mpg ~ wt + hp on mtcars, predict for three new cars, and compare
# actual vs. predicted mpg against the identity line (needs ggplot2).

library(ggplot2) # For visualization

# mtcars ships with R's datasets package.
data(mtcars)

# Quick look at the data before modelling.
head(mtcars)
summary(mtcars)

# Linear model: fuel economy as a function of weight and horsepower.
model <- lm(mpg ~ wt + hp, data = mtcars)

# Coefficients, residuals and fit statistics.
summary(model)

# Three hypothetical cars to score with the fitted model.
new_data <- data.frame(wt = c(2.5, 3.0, 3.5), hp = c(100, 120, 150))
predictions <- predict(model, new_data)

cat("Predictions for new data:\n")
print(predictions)

# Keep in-sample predictions next to the observations for plotting.
mtcars$predicted_mpg <- predict(model, mtcars)

# Points lying on the red identity line are predicted perfectly.
ggplot(mtcars, aes(x = mpg, y = predicted_mpg)) +
  geom_point(color = "blue") +
  geom_abline(intercept = 0, slope = 1, color = "red") +
  labs(title = "Actual vs. Predicted MPG",
       x = "Actual MPG",
       y = "Predicted MPG") +
  theme_minimal()

OUTPUT :
EX.NO : 9 – CLASSIFICATION MODEL.

PROGRAM:
# Random-forest classification of iris species: 70/30 stratified split,
# model training via caret, evaluation with a confusion matrix.

install.packages("caret")
install.packages("randomForest")
library(caret)
library(randomForest)

data(iris)

# Reproducible 70% training partition, stratified by Species.
set.seed(123)
trainIndex <- createDataPartition(iris$Species, p = 0.7, list = FALSE)
trainData <- iris[trainIndex, ]
testData <- iris[-trainIndex, ]

# Fit a random forest ("rf") on all predictors of the training rows.
model <- train(Species ~ ., data = trainData, method = "rf")

# Score the held-out 30%.
predictions <- predict(model, newdata = testData)

# Accuracy, kappa and per-class sensitivity/specificity.
confMatrix <- confusionMatrix(predictions, testData$Species)
print(confMatrix)

OUTPUT :

Confusion Matrix and Statistics

Reference
Prediction setosa versicolor virginica
setosa 15 0 0
versicolor 0 14 2
virginica 0 1 13

Overall Statistics

Accuracy : 0.9333
95% CI : (0.8173, 0.986)
No Information Rate : 0.3333
P-Value [Acc > NIR] : < 2.2e-16

Kappa : 0.9
Mcnemar's Test P-Value : NA

Statistics by Class:

Class: setosa Class: versicolor Class: virginica


Sensitivity 1.0000 0.9333 0.8667
Specificity 1.0000 0.9333 0.9667
Pos Pred Value 1.0000 0.8750 0.9286
Neg Pred Value 1.0000 0.9655 0.9355
Prevalence 0.3333 0.3333 0.3333
Detection Rate 0.3333 0.3111 0.2889
Detection Prevalence 0.3333 0.3556 0.3111
Balanced Accuracy 1.0000 0.9333 0.9167

EX.NO : 10. CLUSTERING MODEL

PROGRAM:
# K-means clustering of the iris measurements (species label removed),
# attaching the resulting cluster back onto the data for later plotting.

set.seed(123) # For reproducibility

data(iris)

# Drop column 5 (Species): clustering uses only the numeric features.
iris_data <- iris[, -5]

# k = 3 clusters; 20 random starts guard against poor local optima.
kmeans_result <- kmeans(iris_data, centers = 3, nstart = 20)

# One cluster label (1-3) per flower.
print(kmeans_result$cluster)

# Store the assignment as a factor column on the original data.
iris$Cluster <- as.factor(kmeans_result$cluster)

# Visualize the clusters on the two petal dimensions; each point is
# coloured by the Cluster factor computed above (requires ggplot2).
library(ggplot2)

ggplot(iris, aes(x = Petal.Length, y = Petal.Width, color = Cluster)) +
  geom_point(size = 3) +
  labs(title = "K-means Clustering of Iris Dataset") +
  theme_minimal()
OUTPUT:

You might also like