Machine Learning Algorithms From Scratch


LINEAR REGRESSION From Scratch:

import numpy as np
from tqdm import tqdm  # progress bar used in the training loop below
class LinearRegression():

def __init__(self,lr,n_iter):
self.lr=lr #learning rate
self.n_iter=n_iter #number_of_iteration_to_train
self.weights=None
self.bias=None

def fit_model(self,X,y):
"""to train model using gradient descent"""
n_samples,n_features=X.shape
self.weights=np.random.rand(n_features)
self.bias=0

for _ in tqdm(range(self.n_iter)):

# calculate y_predicted
y_pred=np.dot(X,self.weights)+self.bias

# Compute Gradients
delw=(1/n_samples)*np.dot(X.T,(y_pred-y))
delb=(1/n_samples)*np.sum(y_pred-y)

# update weights and bias


self.weights=self.weights-self.lr*delw
self.bias=self.bias-self.lr*delb
return

def predict(self,X):
return (np.dot(X,self.weights)+self.bias)
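
A minimal usage sketch for the class above, assuming a small synthetic one-feature dataset; the data, learning rate, and iteration count are illustrative assumptions, not recommendations:

# Usage sketch (synthetic data and hyperparameters are assumptions)
np.random.seed(0)
X_demo = np.random.rand(100, 1)
y_demo = 3 * X_demo[:, 0] + 2 + 0.1 * np.random.randn(100)
reg = LinearRegression(lr=0.1, n_iter=1000)
reg.fit_model(X_demo, y_demo)
print("weights:", reg.weights, "bias:", reg.bias)
print("predictions:", reg.predict(np.array([[0.0], [1.0]])))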
LOGISTIC REGRESSION From Scratch:

class LogisticRegression():

def __init__(self,lr,n_iter):
self.lr=lr
self.n_iter=n_iter
self.weights=None
self.bias=None

def sigmoid(self,z):
return 1 / (1 + np.exp(-z))

def fit_model(self,X,y):
n_samples,n_features=X.shape

# weight bias initialization


self.weights=np.random.rand(n_features)
self.bias=0

# start training iterations


for _ in range(self.n_iter):
linear_output=np.dot(X,self.weights)+self.bias
y_pred=self.sigmoid(linear_output)

# compute gradient
delw= (1/n_samples)*np.dot(X.T, (y_pred-y))
delb= (1/n_samples)*np.sum(y_pred-y)

# update weights and bias


self.weights=self.weights-self.lr*delw
self.bias=self.bias-self.lr*delb

def predict_class(self,X):
linear_output=np.dot(X,self.weights)+self.bias
y_pred=self.sigmoid(linear_output)
y_pred_class=[1 if i>0.5 else 0 for i in y_pred]
return y_pred_class
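
A minimal usage sketch, assuming synthetic two-feature data separated by the line x1 + x2 = 1; the data and hyperparameters below are illustrative assumptions:

# Usage sketch (synthetic data and hyperparameters are assumptions)
np.random.seed(0)
X_demo = np.random.rand(200, 2)
y_demo = (X_demo[:, 0] + X_demo[:, 1] > 1).astype(int)
clf = LogisticRegression(lr=0.5, n_iter=2000)
clf.fit_model(X_demo, y_demo)
print("predicted classes:", clf.predict_class(np.array([[0.9, 0.8], [0.1, 0.2]])))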
K-Means Clustering From Scratch:
def kmeans(data, K, max_iterations=100, tolerance=1e-4):
    # Randomly initialize centroids
    centroids = random_initialize_centroids(data, K)
    for _ in range(max_iterations):
        # Assignment Step: group points by the index of their nearest centroid
        # (indices are used as dictionary keys because numpy arrays are not hashable)
        clusters = {}
        for point in data:
            nearest_idx = find_nearest_centroid(point, centroids)
            if nearest_idx in clusters:
                clusters[nearest_idx].append(point)
            else:
                clusters[nearest_idx] = [point]

        # Update Step: move each centroid to the mean of its assigned points
        new_centroids = []
        for idx, centroid in enumerate(centroids):
            if idx in clusters:
                new_centroids.append(calculate_mean(clusters[idx]))
            else:
                # keep a centroid in place if no points were assigned to it
                new_centroids.append(centroid)

        # Check for convergence
        if convergence(new_centroids, centroids, tolerance):
            break

        centroids = new_centroids

    return centroids, clusters

def random_initialize_centroids(data, K):
    # Randomly select K data points as initial centroids
    return data[np.random.choice(data.shape[0], K, replace=False)]
def find_nearest_centroid(point, centroids):
    # Calculate distances between the point and all centroids
    distances = [np.linalg.norm(point - centroid) for centroid in centroids]
    # Return the index of the centroid with the minimum distance
    return np.argmin(distances)
def calculate_mean(points):
# Calculate the mean (average) of a list of points
return np.mean(points, axis=0)

def convergence(new_centroids, old_centroids, tolerance):
    # Check if centroids have converged (i.e., no significant change)
    return np.max(np.abs(np.array(new_centroids) - np.array(old_centroids))) < tolerance
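
A minimal usage sketch for the k-means code above, assuming two well-separated synthetic blobs; the data and the choice of K are illustrative assumptions:

# Usage sketch (synthetic blob data and K are assumptions)
np.random.seed(0)
blob_data = np.vstack([np.random.randn(50, 2), np.random.randn(50, 2) + 5])
final_centroids, final_clusters = kmeans(blob_data, K=2)
print("final centroids:", final_centroids)
print("cluster sizes:", {idx: len(pts) for idx, pts in final_clusters.items()})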
Density-Based Spatial Clustering of Applications with Noise (DBSCAN):
import numpy as np

class DBSCAN:
    def __init__(self, epsilon, min_points):
        self.epsilon = epsilon
        self.min_points = min_points
        self.visited = set()

    def fit(self, data):
        self.data = data
        self.clusters = []

        # Work with point indices so they can be stored in the visited set
        # (numpy arrays themselves are not hashable)
        for idx in range(len(self.data)):
            if idx not in self.visited:
                self.visited.add(idx)
                neighbors = self.range_query(idx)

                # Points with too few neighbours are left as noise
                if len(neighbors) < self.min_points:
                    continue

                cluster = self.expand_cluster(idx, neighbors)
                self.clusters.append(cluster)
        return self.clusters

    def range_query(self, idx):
        # Return the indices of all points within epsilon of point idx
        neighbors = []
        for q in range(len(self.data)):
            if np.linalg.norm(self.data[idx] - self.data[q]) <= self.epsilon:
                neighbors.append(q)
        return neighbors

    def expand_cluster(self, idx, neighbors):
        cluster = [idx]

        for neighbor in neighbors:
            if neighbor not in self.visited:
                self.visited.add(neighbor)
                new_neighbors = self.range_query(neighbor)
                # Core points grow the neighbourhood still to be explored
                if len(new_neighbors) >= self.min_points:
                    neighbors.extend(new_neighbors)
            # Add the point to this cluster if it does not already belong to one
            if neighbor not in cluster and neighbor not in [p for c in self.clusters for p in c]:
                cluster.append(neighbor)

        return cluster
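
A minimal usage sketch for the DBSCAN class above; the epsilon and min_points values are illustrative assumptions rather than tuned settings, and the returned clusters contain point indices:

# Usage sketch (synthetic data and parameter values are assumptions)
np.random.seed(0)
demo_points = np.vstack([np.random.randn(30, 2), np.random.randn(30, 2) + 10])
dbscan = DBSCAN(epsilon=1.5, min_points=4)
found_clusters = dbscan.fit(demo_points)
print("number of clusters found:", len(found_clusters))
print("cluster sizes:", [len(c) for c in found_clusters])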
Gradient Boosting for Regression:

import numpy as np

class GradientBoostingRegression:
def __init__(self, num_iterations=100, learning_rate=0.1):
self.num_iterations = num_iterations
self.learning_rate = learning_rate
self.models = []

    def fit(self, X, y):
        # Start from a constant prediction: the mean of the training targets
        self.initial_prediction = np.mean(y)
        F = np.full(len(y), self.initial_prediction)
        for _ in range(self.num_iterations):
            # Pseudo-residuals for squared error loss: the negative gradient (y - F)
            residuals = y - F

            # Train a linear regressor on the residuals (e.g., using least squares)
            weak_learner = self.train_linear_regressor(X, residuals)

            prediction = weak_learner.predict(X)
            F += self.learning_rate * prediction
            self.models.append(weak_learner)

    def train_linear_regressor(self, X, residuals):
        # Implement linear regression (e.g., using numpy or scikit-learn)
        # Return the fitted linear regressor (e.g., its coefficients)
        pass  # Replace with your linear regression training code

    def predict(self, X):
        # Start from the same constant prediction used during training
        predictions = self.initial_prediction * np.ones(X.shape[0])
        for model in self.models:
            predictions += self.learning_rate * model.predict(X)
        return predictions
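
One way to fill in the train_linear_regressor placeholder above is an ordinary least-squares fit. The LeastSquaresRegressor helper below is a name introduced here purely for illustration; inside GradientBoostingRegression, train_linear_regressor could then simply return LeastSquaresRegressor().fit(X, residuals).

# Hypothetical least-squares weak learner for the placeholder above
class LeastSquaresRegressor:
    def fit(self, X, residuals):
        # Append a column of ones so an intercept term is learned as well
        X_aug = np.hstack([X, np.ones((X.shape[0], 1))])
        self.coef_, *_ = np.linalg.lstsq(X_aug, residuals, rcond=None)
        return self

    def predict(self, X):
        X_aug = np.hstack([X, np.ones((X.shape[0], 1))])
        return X_aug @ self.coef_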
AdaBoost with Decision Stumps:
import numpy as np

class DecisionStump:
def __init__(self):
self.feature_index = None
self.threshold = None
self.alpha = None

def fit(self, X, y, sample_weights):


num_samples, num_features = X.shape
min_error = float('inf')

for feature_index in range(num_features):


unique_thresholds = np.unique(X[:, feature_index])
for threshold in unique_thresholds:
y_pred = np.ones(num_samples)
y_pred[X[:, feature_index] < threshold] = -1

error = np.sum(sample_weights[y_pred != y])

if error < min_error:


min_error = error
self.feature_index = feature_index
self.threshold = threshold

# Calculate alpha (classifier weight)


        self.alpha = 0.5 * np.log((1 - min_error) / (min_error + 1e-10))

def predict(self, X):


num_samples = X.shape[0]
y_pred = np.ones(num_samples)
y_pred[X[:, self.feature_index] < self.threshold] = -1
return y_pred

class AdaBoost:
def __init__(self, num_iterations=50):
self.num_iterations = num_iterations
self.classifiers = []
self.alphas = []

def fit(self, X, y):


num_samples = X.shape[0]
sample_weights = np.ones(num_samples) / num_samples
for _ in range(self.num_iterations):
classifier = DecisionStump()
classifier.fit(X, y, sample_weights)

y_pred = classifier.predict(X)
            weighted_error = np.sum(sample_weights[y_pred != y]) / np.sum(sample_weights)

# Calculate classifier weight (alpha)


            alpha = 0.5 * np.log((1 - weighted_error) / (weighted_error + 1e-10))
self.alphas.append(alpha)

# Update sample weights


sample_weights *= np.exp(-alpha * y * y_pred)
sample_weights /= np.sum(sample_weights)

self.classifiers.append(classifier)

def predict(self, X):


num_samples = X.shape[0]
final_predictions = np.zeros(num_samples)

for alpha, classifier in zip(self.alphas, self.classifiers):


final_predictions += alpha * classifier.predict(X)

return np.sign(final_predictions)

# Example usage:
if __name__ == "__main__":
# Generate synthetic data for binary classification
np.random.seed(0)
X = np.random.rand(100, 2)
y = np.where(X[:, 0] + X[:, 1] > 1, 1, -1)

    # Train the AdaBoost classifier with Decision Stumps as base learners
adaboost = AdaBoost(num_iterations=50)
adaboost.fit(X, y)

# Make predictions
X_test = np.array([[0.7, 0.3], [0.4, 0.6]])
y_pred = adaboost.predict(X_test)
print("Predicted:", y_pred)
Neural Network for Binary Classification:
import numpy as np

# Define the sigmoid activation function and its derivative


def sigmoid(x):
return 1 / (1 + np.exp(-x))

def sigmoid_derivative(x):
    # Assumes x is already a sigmoid output, so the derivative is x * (1 - x)
    return x * (1 - x)

class NeuralNetwork:
    def __init__(self, input_size, hidden_size, output_size, learning_rate=0.1):
# Initialize network architecture and hyperparameters
self.input_size = input_size
self.hidden_size = hidden_size
self.output_size = output_size
self.learning_rate = learning_rate

# Initialize weights and biases with random values


        self.weights_input_hidden = np.random.randn(self.input_size, self.hidden_size)
        self.bias_hidden = np.zeros((1, self.hidden_size))
        self.weights_hidden_output = np.random.randn(self.hidden_size, self.output_size)
        self.bias_output = np.zeros((1, self.output_size))

def forward(self, X):


# Forward propagation through the network
        self.hidden_input = np.dot(X, self.weights_input_hidden) + self.bias_hidden
        self.hidden_output = sigmoid(self.hidden_input)
        self.output_input = np.dot(self.hidden_output, self.weights_hidden_output) + self.bias_output
        self.predicted_output = sigmoid(self.output_input)
return self.predicted_output
def backward(self, X, y):
# Backpropagation and weight updates
error = y - self.predicted_output

# Calculate gradients
        delta_output = error * sigmoid_derivative(self.predicted_output)
        d_weights_hidden_output = np.dot(self.hidden_output.T, delta_output)
        delta_hidden = np.dot(delta_output, self.weights_hidden_output.T) * sigmoid_derivative(self.hidden_output)
        d_weights_input_hidden = np.dot(X.T, delta_hidden)

# Update weights and biases


        self.weights_hidden_output += self.learning_rate * d_weights_hidden_output
        self.bias_output += self.learning_rate * np.sum(delta_output, axis=0)
        self.weights_input_hidden += self.learning_rate * d_weights_input_hidden
        self.bias_hidden += self.learning_rate * np.sum(delta_hidden, axis=0)
def train(self, X, y, epochs):
for epoch in range(epochs):
# Forward and backward pass for each data point
for i in range(len(X)):
input_data = X[i].reshape(1, -1)
target_output = y[i].reshape(1, -1)
predicted_output = self.forward(input_data)
self.backward(input_data, target_output)

            # Calculate and print the mean squared error for this epoch
            mse = np.mean(np.square(y.reshape(-1, 1) - self.forward(X)))
            print(f"Epoch {epoch + 1}/{epochs}, Mean Squared Error: {mse:.4f}")
# Example usage:
if __name__ == "__main__":
# Generate synthetic data for binary classification
np.random.seed(0)
X = np.random.rand(100, 2)
y = np.where(X[:, 0] + X[:, 1] > 1, 1, 0)

# Define and train the neural network


input_size = 2
hidden_size = 4
output_size = 1
learning_rate = 0.1
epochs = 1000

    nn = NeuralNetwork(input_size, hidden_size, output_size, learning_rate)
nn.train(X, y, epochs)
# Make predictions
X_test = np.array([[0.7, 0.3], [0.4, 0.6]])
predictions = nn.forward(X_test)
print("Predicted:", predictions)
