ML Assignment 01 Code

This document performs principal component analysis (PCA) on the Iris dataset using Python and Scikit-learn. It loads and explores the Iris data, applies PCA to reduce the dimensionality, and analyzes the results, including the number of components retained, the explained variance, and the contribution of each original feature to the principal components.
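
All three code listings below apply the same selection rule: keep the smallest number of principal components whose cumulative explained variance reaches a chosen threshold (95% here), where the explained variance ratio of each component is its eigenvalue divided by the sum of all eigenvalues. A minimal sketch of that rule, using made-up eigenvalues rather than the Iris data:

import numpy as np

# Hypothetical (made-up) eigenvalues, already sorted in descending order
eigenvalues = np.array([2.9, 0.9, 0.15, 0.05])

# Explained variance ratio of each component and its running total
ratios = eigenvalues / eigenvalues.sum()
cumulative = np.cumsum(ratios)            # [0.725, 0.95, 0.9875, 1.0]

# Smallest k whose cumulative ratio reaches the 95% threshold
k = int(np.argmax(cumulative >= 0.95)) + 1
print(k)                                  # 2 for these example values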

Code 01

import numpy as np
import pandas as pd
from sklearn import datasets
from sklearn.decomposition import PCA

# Load the Iris dataset
iris = datasets.load_iris()
data, columns = iris.data, iris.feature_names

# Create a Pandas DataFrame from the Iris dataset
df = pd.DataFrame(data, columns=columns)

# Step 1: Mean normalize the features
normalized_data = (df - df.mean()) / df.std()

# Step 2: Find the covariance matrix
covariance_matrix = np.cov(normalized_data, rowvar=False)

# Step 3: Find eigenvalues and eigenvectors of the covariance matrix
eigenvalues, eigenvectors = np.linalg.eig(covariance_matrix)

# Step 4: Arrange eigenvalues in descending order
sorted_indices = np.argsort(eigenvalues)[::-1]
sorted_eigenvalues = eigenvalues[sorted_indices]
sorted_eigenvectors = eigenvectors[:, sorted_indices]

# Step 5: Select eigenvalues that retain the required variance
total_variance = np.sum(sorted_eigenvalues)
variance_to_retain = 0.95
cumulative_variance = np.cumsum(sorted_eigenvalues) / total_variance
num_components_to_retain = np.argmax(cumulative_variance >= variance_to_retain) + 1

selected_eigenvalues = sorted_eigenvalues[:num_components_to_retain]
selected_eigenvectors = sorted_eigenvectors[:, :num_components_to_retain]

# Step 6: Transform original data using eigenvectors corresponding to selected eigenvalues
transformed_data = np.dot(normalized_data, selected_eigenvectors)

# Print the results
print(f"Number of components to retain {variance_to_retain * 100}% variance: {num_components_to_retain}")
print("Explained variance ratio:", selected_eigenvalues / total_variance)

# Interpret which features influenced the principal components the most
feature_contributions = np.abs(selected_eigenvectors) / np.sum(np.abs(selected_eigenvectors), axis=0)
feature_contributions_df = pd.DataFrame(feature_contributions, index=columns,
                                        columns=[f'PC{i + 1}' for i in range(num_components_to_retain)])
print("\nFeature contributions to Principal Components:")
print(feature_contributions_df)
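
As an optional sanity check (not part of the original assignment), the manual eigendecomposition above can be compared against Scikit-learn's PCA: the explained variance ratios should agree, while the projected coordinates may differ only by a per-component sign flip, since eigenvectors are defined only up to sign. A minimal sketch, assuming the variables from the script above (normalized_data, variance_to_retain, transformed_data, selected_eigenvalues, total_variance, num_components_to_retain) are still in scope; pca_check, sklearn_transformed, and signs are illustrative names:

from sklearn.decomposition import PCA

# Fit Scikit-learn's PCA with the same 95% variance threshold on the same data
# (the data is already mean-normalized, so sklearn's internal centering changes nothing)
pca_check = PCA(n_components=variance_to_retain)
sklearn_transformed = pca_check.fit_transform(normalized_data)

# Component count and explained variance ratios should match the manual result
print(pca_check.n_components_, num_components_to_retain)
print(pca_check.explained_variance_ratio_, selected_eigenvalues / total_variance)

# Projections should agree up to a sign flip of individual components
signs = np.sign(np.sum(transformed_data * sklearn_transformed, axis=0))
print(np.allclose(transformed_data * signs, sklearn_transformed, atol=1e-6))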

Code 02

import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
from sklearn import datasets
from sklearn.decomposition import PCA


def load_iris_data():
    iris = datasets.load_iris()
    data, columns = iris.data, iris.feature_names
    return pd.DataFrame(data, columns=columns), iris.target


def display_correlation_matrix(df):
    correlation_matrix = df.corr()
    print("Correlation Matrix:")
    print(correlation_matrix)


def normalize_features(df):
    return (df - df.mean()) / df.std()


def perform_pca(data, target):
    pca = PCA(n_components=0.95)
    transformed_data = pca.fit_transform(data)
    plot_before_after_pca(data, transformed_data, target)
    display_pca_info(pca)
    display_feature_contributions(pca.components_, data.columns)


def plot_before_after_pca(original_data, transformed_data, target):
    plt.figure(figsize=(12, 6))

    # Original Data
    plt.subplot(1, 2, 1)
    plt.scatter(original_data.iloc[:, 0], original_data.iloc[:, 1], c=target, cmap='Set1')
    plt.title('Original Data')
    plt.xlabel('Feature 01')
    plt.ylabel('Feature 02')

    # Data after PCA
    plt.subplot(1, 2, 2)
    plt.scatter(transformed_data[:, 0], transformed_data[:, 1], c=target, cmap='Set1')
    plt.title('Data after PCA')
    plt.xlabel('Principal Component 01')
    plt.ylabel('Principal Component 02')

    plt.savefig('output_plot.png')
    plt.show()


def display_pca_info(pca):
    print(f"\nNumber of components to retain 95% variance: {pca.n_components_}")
    print("Explained variance ratio:", pca.explained_variance_ratio_)


def display_feature_contributions(components, columns):
    feature_contributions = np.abs(components) / np.sum(np.abs(components), axis=1)[:, np.newaxis]
    feature_contributions_df = pd.DataFrame(feature_contributions.T, index=columns,
                                            columns=[f'PC{i + 1}' for i in range(components.shape[0])])

    print("\nFeature contributions to Principal Components:")
    print(feature_contributions_df)

    # Plotting the feature contributions
    plt.figure(figsize=(12, 6))
    for i in range(components.shape[0]):
        plt.subplot(1, components.shape[0], i + 1)
        plt.bar(columns, feature_contributions_df.iloc[:, i])
        plt.title(f'PC{i + 1} Feature Contributions')
        plt.xlabel('Original Features')
        plt.ylabel('Contribution')
    plt.savefig('output_plot_feature_contributions.png')
    plt.show()


def main():
    iris_data, target = load_iris_data()
    display_correlation_matrix(iris_data)
    normalized_data = normalize_features(iris_data)
    perform_pca(normalized_data, target)


if __name__ == "__main__":
    main()
Code 03

import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
from sklearn import datasets
from sklearn.decomposition import PCA

# Load the Iris dataset
iris = datasets.load_iris()
data, columns = iris.data, iris.feature_names

# Create a Pandas DataFrame from the Iris dataset
df = pd.DataFrame(data, columns=columns)

# Display the correlation matrix
correlation_matrix = df.corr()
print("Correlation Matrix:")
print(correlation_matrix)

# Mean normalize the features
normalized_data = (df - df.mean()) / df.std()

# Perform PCA using Scikit-learn, retaining 95% of the variance
pca = PCA(n_components=0.95)
transformed_data = pca.fit_transform(normalized_data)

# Plotting the data before and after PCA
plt.figure(figsize=(12, 6))

# Original Data
plt.subplot(1, 2, 1)
plt.scatter(normalized_data.iloc[:, 0], normalized_data.iloc[:, 1], c=iris.target, cmap='Set1')
plt.title('Original Data')
plt.xlabel('Feature 01')
plt.ylabel('Feature 02')

# Data after PCA
plt.subplot(1, 2, 2)
plt.scatter(transformed_data[:, 0], transformed_data[:, 1], c=iris.target, cmap='Set1')
plt.title('Data after PCA')
plt.xlabel('Principal Component 01')
plt.ylabel('Principal Component 02')

plt.savefig('output_plot.png')
plt.show()

# Display the number of components and explained variance ratio
print(f"\nNumber of components to retain 95% variance: {pca.n_components_}")
print("Explained variance ratio:", pca.explained_variance_ratio_)

# Interpreting which features influenced the principal components the most
feature_contributions = np.abs(pca.components_) / np.sum(np.abs(pca.components_), axis=1)[:, np.newaxis]
feature_contributions_df = pd.DataFrame(feature_contributions.T, index=columns,
                                        columns=[f'PC{i + 1}' for i in range(pca.n_components_)])

print("\nFeature contributions to Principal Components:")
print(feature_contributions_df)

# Plotting the feature contributions
plt.figure(figsize=(12, 6))
for i in range(pca.n_components_):
    plt.subplot(1, pca.n_components_, i + 1)
    plt.bar(columns, feature_contributions_df.iloc[:, i])
    plt.title(f'PC{i + 1} Feature Contributions')
    plt.xlabel('Original Features')
    plt.ylabel('Contribution')

plt.savefig('output_plot_feature_contributions.png')
plt.show()
