Machine Learning Algorithms From Scratch

LINEAR REGRESSION From Scratch:

import numpy as np
from tqdm import tqdm  # progress bar for the training loop (requires the tqdm package)

class LinearRegression():

    def __init__(self, lr, n_iter):
        self.lr = lr              # learning rate
        self.n_iter = n_iter      # number of iterations to train
        self.weights = None
        self.bias = None

    def fit_model(self, X, y):
        """Train the model using gradient descent."""
        n_samples, n_features = X.shape
        self.weights = np.random.rand(n_features)
        self.bias = 0

        for _ in tqdm(range(self.n_iter)):

            # calculate y_predicted
            y_pred = np.dot(X, self.weights) + self.bias

            # compute gradients
            delw = (1 / n_samples) * np.dot(X.T, (y_pred - y))
            delb = (1 / n_samples) * np.sum(y_pred - y)

            # update weights and bias
            self.weights = self.weights - self.lr * delw
            self.bias = self.bias - self.lr * delb
        return

    def predict(self, X):
        return np.dot(X, self.weights) + self.bias
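
A minimal usage sketch for the class above; the synthetic data, learning rate, and iteration count are illustrative choices, not part of the original notes:

# Example usage:
if __name__ == "__main__":
    np.random.seed(0)
    X = np.random.rand(100, 3)
    y = X @ np.array([2.0, -1.0, 0.5]) + 3.0 + 0.01 * np.random.randn(100)

    model = LinearRegression(lr=0.1, n_iter=1000)
    model.fit_model(X, y)
    print("Weights:", model.weights)
    print("Bias:", model.bias)
    print("Predictions:", model.predict(X[:5]))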
LOGISTIC REGRESSION From Scratch:

class LogisticRegression():

    def __init__(self, lr, n_iter):
        self.lr = lr
        self.n_iter = n_iter
        self.weights = None
        self.bias = None

    def sigmoid(self, z):
        return 1 / (1 + np.exp(-z))

    def fit_model(self, X, y):
        n_samples, n_features = X.shape

        # weight and bias initialization
        self.weights = np.random.rand(n_features)
        self.bias = 0

        # start training iterations
        for _ in range(self.n_iter):
            linear_output = np.dot(X, self.weights) + self.bias
            y_pred = self.sigmoid(linear_output)

            # compute gradients
            delw = (1 / n_samples) * np.dot(X.T, (y_pred - y))
            delb = (1 / n_samples) * np.sum(y_pred - y)

            # update weights and bias
            self.weights = self.weights - self.lr * delw
            self.bias = self.bias - self.lr * delb

    def predict_class(self, X):
        linear_output = np.dot(X, self.weights) + self.bias
        y_pred = self.sigmoid(linear_output)
        y_pred_class = [1 if i > 0.5 else 0 for i in y_pred]
        return y_pred_class
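
A minimal usage sketch for the class above, on illustrative synthetic data (labels are 1 when the two features sum to more than 1):

# Example usage:
if __name__ == "__main__":
    np.random.seed(0)
    X = np.random.rand(100, 2)
    y = np.where(X[:, 0] + X[:, 1] > 1, 1, 0)

    clf = LogisticRegression(lr=0.1, n_iter=1000)
    clf.fit_model(X, y)
    print("Predicted classes:", clf.predict_class(X[:5]))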
K-Means Clustering From Scratch:

def kmeans(data, K, max_iterations=100, tolerance=1e-4):
    # Randomly initialize centroids
    centroids = random_initialize_centroids(data, K)
    for _ in range(max_iterations):
        # Assignment step: group points by the index of their nearest centroid
        # (indices are used as dictionary keys because numpy arrays are not hashable)
        clusters = {}
        for point in data:
            nearest_centroid = find_nearest_centroid(point, centroids)
            if nearest_centroid in clusters:
                clusters[nearest_centroid].append(point)
            else:
                clusters[nearest_centroid] = [point]

        # Update step: move each centroid to the mean of its assigned points
        new_centroids = []
        for idx, centroid in enumerate(centroids):
            if idx in clusters:
                new_centroids.append(calculate_mean(clusters[idx]))
            else:
                new_centroids.append(centroid)  # keep a centroid with no assigned points unchanged

        # Check for convergence
        if convergence(new_centroids, centroids, tolerance):
            break

        centroids = new_centroids

    return centroids, clusters

def random_initialize_centroids(data, K):
    # Randomly select K data points as initial centroids
    return data[np.random.choice(data.shape[0], K, replace=False)]

def find_nearest_centroid(point, centroids):
    # Calculate distances between the point and all centroids
    distances = [np.linalg.norm(point - centroid) for centroid in centroids]
    # Return the index of the centroid with the minimum distance
    return np.argmin(distances)

def calculate_mean(points):
    # Calculate the mean (average) of a list of points
    return np.mean(points, axis=0)

def convergence(new_centroids, old_centroids, tolerance):
    # Check if centroids have converged (i.e., no significant change)
    return np.max(np.abs(np.array(new_centroids) - np.array(old_centroids))) < tolerance
Density-Based Spatial Clustering of Applications with Noise (DBSCAN):

import numpy as np

class DBSCAN:
    def __init__(self, epsilon, min_points):
        self.epsilon = epsilon
        self.min_points = min_points
        self.visited = set()

    def fit(self, data):
        self.data = data
        self.clusters = []

        # Iterate over point indices (numpy rows are not hashable, so indices are tracked instead)
        for idx in range(len(self.data)):
            if idx not in self.visited:
                self.visited.add(idx)
                neighbors = self.range_query(idx)

                # A point with too few neighbors is treated as noise
                if len(neighbors) < self.min_points:
                    continue

                cluster = self.expand_cluster(idx, neighbors)
                self.clusters.append(cluster)
        return self.clusters

    def range_query(self, idx):
        # Return the indices of all points within epsilon of the given point
        neighbors = []
        for q in range(len(self.data)):
            if np.linalg.norm(self.data[idx] - self.data[q]) <= self.epsilon:
                neighbors.append(q)
        return neighbors

    def expand_cluster(self, idx, neighbors):
        cluster = [idx]

        # Grow the cluster by exploring density-reachable neighbors
        for neighbor in neighbors:
            if neighbor not in self.visited:
                self.visited.add(neighbor)
                new_neighbors = self.range_query(neighbor)
                if len(new_neighbors) >= self.min_points:
                    neighbors.extend(new_neighbors)
                if neighbor not in [p for c in self.clusters for p in c]:
                    cluster.append(neighbor)

        return cluster
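
A minimal usage sketch for the DBSCAN class above, which returns clusters as lists of point indices; epsilon and min_points are illustrative values chosen for two synthetic blobs plus one far-away outlier:

# Example usage:
if __name__ == "__main__":
    np.random.seed(0)
    data = np.vstack([np.random.randn(50, 2),
                      np.random.randn(50, 2) + 10,
                      [[100.0, 100.0]]])
    dbscan = DBSCAN(epsilon=2.0, min_points=5)
    clusters = dbscan.fit(data)
    print("Clusters found:", len(clusters))
    print("Cluster sizes:", [len(c) for c in clusters])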
Gradient Boosting for Regression:

import numpy as np

class LinearRegressorLS:
    # A simple least-squares linear regressor used as the weak learner.
    # The original left this as a placeholder; np.linalg.lstsq is one possible implementation.
    def fit(self, X, y):
        Xb = np.hstack([X, np.ones((X.shape[0], 1))])   # add a bias column
        self.coef_, *_ = np.linalg.lstsq(Xb, y, rcond=None)
        return self

    def predict(self, X):
        Xb = np.hstack([X, np.ones((X.shape[0], 1))])
        return Xb @ self.coef_

class GradientBoostingRegression:
    def __init__(self, num_iterations=100, learning_rate=0.1):
        self.num_iterations = num_iterations
        self.learning_rate = learning_rate
        self.models = []

    def fit(self, X, y):
        # Initial prediction: the mean of the targets
        self.initial_prediction = np.mean(y)
        F = np.full(len(y), self.initial_prediction)
        for _ in range(self.num_iterations):
            # Residuals are the negative gradient of the squared loss: y - F
            residuals = y - F

            # Train a linear regressor on the residuals (e.g., using least squares)
            weak_learner = self.train_linear_regressor(X, residuals)

            prediction = weak_learner.predict(X)
            F += self.learning_rate * prediction
            self.models.append(weak_learner)

    def train_linear_regressor(self, X, residuals):
        # Fit the weak learner to the current residuals and return it
        return LinearRegressorLS().fit(X, residuals)

    def predict(self, X):
        # Start from the stored initial prediction and add each weak learner's contribution
        predictions = self.initial_prediction * np.ones(X.shape[0])
        for model in self.models:
            predictions += self.learning_rate * model.predict(X)
        return predictions
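
A minimal usage sketch for the class above; the synthetic regression data and hyperparameters are illustrative:

# Example usage:
if __name__ == "__main__":
    np.random.seed(0)
    X = np.random.rand(200, 3)
    y = 4.0 * X[:, 0] - 2.0 * X[:, 1] + 0.5 + 0.05 * np.random.randn(200)

    gbr = GradientBoostingRegression(num_iterations=100, learning_rate=0.1)
    gbr.fit(X, y)
    print("Training MSE:", np.mean((y - gbr.predict(X)) ** 2))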
AdaBoost for Decision Trees:

import numpy as np

class DecisionStump:
    def __init__(self):
        self.feature_index = None
        self.threshold = None
        self.alpha = None

    def fit(self, X, y, sample_weights):
        num_samples, num_features = X.shape
        min_error = float('inf')

        for feature_index in range(num_features):
            unique_thresholds = np.unique(X[:, feature_index])
            for threshold in unique_thresholds:
                y_pred = np.ones(num_samples)
                y_pred[X[:, feature_index] < threshold] = -1

                error = np.sum(sample_weights[y_pred != y])

                if error < min_error:
                    min_error = error
                    self.feature_index = feature_index
                    self.threshold = threshold

        # Calculate alpha (classifier weight)
        self.alpha = 0.5 * np.log((1 - min_error) / (min_error + 1e-10))

    def predict(self, X):
        num_samples = X.shape[0]
        y_pred = np.ones(num_samples)
        y_pred[X[:, self.feature_index] < self.threshold] = -1
        return y_pred

class AdaBoost:
    def __init__(self, num_iterations=50):
        self.num_iterations = num_iterations
        self.classifiers = []
        self.alphas = []

    def fit(self, X, y):
        num_samples = X.shape[0]
        sample_weights = np.ones(num_samples) / num_samples
        for _ in range(self.num_iterations):
            classifier = DecisionStump()
            classifier.fit(X, y, sample_weights)

            y_pred = classifier.predict(X)
            weighted_error = np.sum(sample_weights[y_pred != y]) / np.sum(sample_weights)

            # Calculate classifier weight (alpha)
            alpha = 0.5 * np.log((1 - weighted_error) / (weighted_error + 1e-10))
            self.alphas.append(alpha)

            # Update sample weights
            sample_weights *= np.exp(-alpha * y * y_pred)
            sample_weights /= np.sum(sample_weights)

            self.classifiers.append(classifier)

    def predict(self, X):
        num_samples = X.shape[0]
        final_predictions = np.zeros(num_samples)

        for alpha, classifier in zip(self.alphas, self.classifiers):
            final_predictions += alpha * classifier.predict(X)

        return np.sign(final_predictions)

# Example usage:
if __name__ == "__main__":
    # Generate synthetic data for binary classification
    np.random.seed(0)
    X = np.random.rand(100, 2)
    y = np.where(X[:, 0] + X[:, 1] > 1, 1, -1)

    # Train the AdaBoost classifier with decision stumps as base learners
    adaboost = AdaBoost(num_iterations=50)
    adaboost.fit(X, y)

    # Make predictions
    X_test = np.array([[0.7, 0.3], [0.4, 0.6]])
    y_pred = adaboost.predict(X_test)
    print("Predicted:", y_pred)
Neural Network for Binary Classification:

import numpy as np

# Define the sigmoid activation function and its derivative
def sigmoid(x):
    return 1 / (1 + np.exp(-x))

def sigmoid_derivative(x):
    return x * (1 - x)

class NeuralNetwork:
    def __init__(self, input_size, hidden_size, output_size, learning_rate=0.1):
        # Initialize network architecture and hyperparameters
        self.input_size = input_size
        self.hidden_size = hidden_size
        self.output_size = output_size
        self.learning_rate = learning_rate

        # Initialize weights and biases with random values
        self.weights_input_hidden = np.random.randn(self.input_size, self.hidden_size)
        self.bias_hidden = np.zeros((1, self.hidden_size))
        self.weights_hidden_output = np.random.randn(self.hidden_size, self.output_size)
        self.bias_output = np.zeros((1, self.output_size))

    def forward(self, X):
        # Forward propagation through the network
        self.hidden_input = np.dot(X, self.weights_input_hidden) + self.bias_hidden
        self.hidden_output = sigmoid(self.hidden_input)
        self.output_input = np.dot(self.hidden_output, self.weights_hidden_output) + self.bias_output
        self.predicted_output = sigmoid(self.output_input)
        return self.predicted_output

    def backward(self, X, y):
        # Backpropagation and weight updates
        error = y - self.predicted_output

        # Calculate gradients
        delta_output = error * sigmoid_derivative(self.predicted_output)
        d_weights_hidden_output = np.dot(self.hidden_output.T, delta_output)
        delta_hidden = np.dot(delta_output, self.weights_hidden_output.T) * sigmoid_derivative(self.hidden_output)
        d_weights_input_hidden = np.dot(X.T, delta_hidden)

        # Update weights and biases
        self.weights_hidden_output += self.learning_rate * d_weights_hidden_output
        self.bias_output += self.learning_rate * np.sum(delta_output, axis=0)
        self.weights_input_hidden += self.learning_rate * d_weights_input_hidden
        self.bias_hidden += self.learning_rate * np.sum(delta_hidden, axis=0)

    def train(self, X, y, epochs):
        for epoch in range(epochs):
            # Forward and backward pass for each data point
            for i in range(len(X)):
                input_data = X[i].reshape(1, -1)
                target_output = y[i].reshape(1, -1)
                self.forward(input_data)
                self.backward(input_data, target_output)

            # Calculate and print the mean squared error for this epoch
            mse = np.mean(np.square(y.reshape(-1, 1) - self.forward(X)))
            print(f"Epoch {epoch + 1}/{epochs}, Mean Squared Error: {mse:.4f}")

# Example usage:
if __name__ == "__main__":
    # Generate synthetic data for binary classification
    np.random.seed(0)
    X = np.random.rand(100, 2)
    y = np.where(X[:, 0] + X[:, 1] > 1, 1, 0)

    # Define and train the neural network
    input_size = 2
    hidden_size = 4
    output_size = 1
    learning_rate = 0.1
    epochs = 1000

    nn = NeuralNetwork(input_size, hidden_size, output_size, learning_rate)
    nn.train(X, y, epochs)

    # Make predictions
    X_test = np.array([[0.7, 0.3], [0.4, 0.6]])
    predictions = nn.forward(X_test)
    print("Predicted:", predictions)
