from google.colab import drive
drive.mount('/content/drive')   # mount Google Drive so the CSV below is reachable
filepath = '/content/drive/MyDrive/data.csv'
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
data=pd.read_csv(filepath)
# split off features (all columns but the last) and the target (last column)
X = data.iloc[:, :-1].values
y = data.iloc[:, -1].values
def cost_function(X, y, w):
    # mean squared error cost: J = (1/2m) * sum((Xw - y)^2)
    hypothesis = np.dot(X, w.T)
    J = (1 / (2 * len(y))) * np.sum((hypothesis - y) ** 2)
    return J
def batch_gradient_descent(X, y, w, alpha, iters):
    # update the weights with the gradient computed over the full training set
    cost_history = np.zeros(iters)
    for i in range(iters):
        hypothesis = np.dot(X, w.T)
        w = w - (alpha / len(y)) * np.dot(hypothesis - y, X)
        cost_history[i] = cost_function(X, y, w)
    return w, cost_history
def stochastic_gradient_descent(X, y, w, alpha, iters):
    # update the weights using one randomly chosen sample per iteration
    cost_history = np.zeros(iters)
    for i in range(iters):
        rand_index = np.random.randint(len(y))   # any index, including the last sample
        ind_x = X[rand_index:rand_index + 1]
        ind_y = y[rand_index:rand_index + 1]
        w = w - alpha * np.dot(np.dot(ind_x, w.T) - ind_y, ind_x)
        cost_history[i] = cost_function(ind_x, ind_y, w)
    return w, cost_history
def MB_gradient_descent(X, y, w, alpha, iters, batch_size):
    # update the weights using a random contiguous mini-batch per iteration
    cost_history = np.zeros(iters)
    for i in range(iters):
        rand_index = np.random.randint(len(y) - batch_size + 1)
        ind_x = X[rand_index:rand_index + batch_size]
        ind_y = y[rand_index:rand_index + batch_size]
        w = w - (alpha / batch_size) * ind_x.T.dot(ind_x.dot(w) - ind_y)
        cost_history[i] = cost_function(ind_x, ind_y, w)
    return w, cost_history
def mean_abs_error(Ypred, Yact):
    # mean absolute error
    return np.mean(np.abs(Yact - Ypred))
def mean_square_error(Ypred, Yact):
    # mean squared error
    return np.mean((Yact - Ypred) ** 2)
def r_squared(y_true, y_pred):
    ss_total = np.sum((y_true - np.mean(y_true)) ** 2)
    ss_residual = np.sum((y_true - y_pred) ** 2)
    return 1 - (ss_residual / ss_total)
def correcoff(Ypred, Yact):
    # Pearson correlation coefficient between predicted and actual values
    ypm = np.mean(Ypred)   # mean of predicted values
    yam = np.mean(Yact)    # mean of actual values
    numerator = np.sum((Yact - yam) * (Ypred - ypm))
    d1 = np.sqrt(np.sum((Yact - yam) ** 2))
    d2 = np.sqrt(np.sum((Ypred - ypm) ** 2))
    return numerator / (d1 * d2)
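# Optional cross-check, not part of the original pipeline: the hand-written
# metrics above can be compared against library equivalents on a tiny toy set.
# This assumes scikit-learn is available (it is preinstalled on Colab); the
# toy arrays below are made up purely for illustration.
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score

_y_true = np.array([3.0, 5.0, 2.5, 7.0])
_y_pred = np.array([2.5, 5.0, 3.0, 8.0])
print(mean_abs_error(_y_pred, _y_true), mean_absolute_error(_y_true, _y_pred))
print(mean_square_error(_y_pred, _y_true), mean_squared_error(_y_true, _y_pred))
print(r_squared(_y_true, _y_pred), r2_score(_y_true, _y_pred))
print(correcoff(_y_pred, _y_true), np.corrcoef(_y_true, _y_pred)[0, 1])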
X = data.iloc[:, :-1]   # all rows, all columns except the last
y = data.iloc[:, -1]    # target column
X = np.asarray(X)
y = np.asarray(y)
m = X.shape[0]

# min-max scale features and target to [0, 1]
xmin = np.min(X, axis=0)
xmax = np.max(X, axis=0)
X_normalized = (X - xmin) / (xmax - xmin)
ymin = np.min(y, axis=0)
ymax = np.max(y, axis=0)
y_normalized = (y - ymin) / (ymax - ymin)

# prepend a column of ones for the bias (intercept) term
m = X_normalized.shape[0]
pp = np.ones([m, 1])
X_normalized = np.append(pp, X_normalized, axis=1)
train_percentage = 0.70
train_size = int(len(X) * train_percentage)
# split the data into training and testing
X_train = X_normalized[:train_size]
y_train = y_normalized[:train_size]
X_test = X_normalized[train_size:]
y_test = y_normalized[train_size:]
print("Training Features Shape:", X_train.shape)
print("Testing Features Shape:", X_test.shape)
print("Training Target Shape:", y_train.shape)
print("Testing Target Shape:", y_test.shape)
Training Features Shape: (56, 9)
Testing Features Shape: (25, 9)
Training Target Shape: (56,)
Testing Target Shape: (25,)
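# Optional baseline, not in the original flow: a closed-form least-squares fit
# on the same training split gives weights that the gradient-descent variants
# below should roughly converge toward. np.linalg.lstsq is standard NumPy.
w_closed, *_ = np.linalg.lstsq(X_train, y_train, rcond=None)
print("Closed-form weights:", w_closed)
print("Closed-form training cost:", cost_function(X_train, y_train, w_closed))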
w= np.zeros((X_normalized.shape[1])) ###weight initialization
w.shape
(9,)
alpha=0.4 ##learning rate
iters=1500 ###iterations
batch_w,J_his = batch_gradient_descent(X_train,y_train,w,alpha,iters)
plt.plot(range(iters),J_his)
plt.xlabel('Iterations')
plt.ylabel('Cost')
plt.title('BGD Cost vs Iterations')
plt.show()
bgd=batch_w
print("WEIGHT VECTOR",bgd)
y_pred_bgd=X_test.dot(bgd.T)
WEIGHT VECTOR [0.21794334 0.10606424 0.0478828  0.03935448 0.03229864 0.03136558 0.11796494 0.06546174 0.03341064]
yp_unnorm=(y_pred_bgd*(ymax-ymin))+ymin
y_test_unnorm=(y_test*(ymax-ymin))+ymin
a=mean_abs_error(yp_unnorm,y_test_unnorm)
print("MEAN ABSOLUTE ERROR",a)
MEAN ABSOLUTE ERROR 1.1326579129012353
b=mean_square_error(yp_unnorm,y_test_unnorm)
print("MEAN SQUARE ERROR:",b)
MEAN SQUARE ERROR: 1.819265635873902
c=correcoff(yp_unnorm,y_test_unnorm)
print("CORRELATION COEFF:",c)
CORRELATION COEFF: 0.2602600569650748
d=r_squared(y_test_unnorm, yp_unnorm)   # y_true first, then y_pred
print("R2:",d)
R2: -226.79600202581813
plt.figure(figsize=(8, 6))
plt.plot(y_test_unnorm, label='Actual Output', color='blue', marker='o')
plt.plot(yp_unnorm, label='Predicted Output', color='red', marker='x')
plt.xlabel('Sample Index')
plt.ylabel('Output Value')
plt.title('Predicted vs Actual Output (Line Plot)')
plt.legend()
plt.show()
alpha=0.4
iters=5000 ###iterations
w_n_l2, J_sgd_l2 = stochastic_gradient_descent(X_train, y_train, w, alpha, iters)
plt.plot(range(iters),J_sgd_l2)
plt.xlabel('Iterations')
plt.ylabel('Cost')
plt.title('SGD Cost vs Iterations')
plt.show()
sgd=w_n_l2
print("WEIGHT VECTOR",sgd)
y_pred_sgd=X_test.dot(sgd.T)
yp_unnorm=(y_pred_sgd*(ymax-ymin))+ymin
y_test_unnorm=(y_test*(ymax-ymin))+ymin
a=mean_abs_error(yp_unnorm,y_test_unnorm)
print("MEAN ABSOLUTE ERROR",a)
b=mean_square_error(yp_unnorm,y_test_unnorm)
print("MEAN SQUARE ERROR:",b)
c=correcoff(y_test_unnorm, yp_unnorm)
print("CORRELATION COEFF:",c)
d=r_squared(y_test_unnorm, yp_unnorm)
print("R2:",d)
plt.figure(figsize=(8, 6))
plt.plot(y_test_unnorm, label='Actual Output', color='blue', marker='o')
plt.plot(yp_unnorm, label='Predicted Output', color='red', marker='x')
plt.xlabel('Sample Index')
plt.ylabel('Output Value')
plt.title('Predicted vs Actual Output (Line Plot)')
plt.legend()
plt.show()
WEIGHT VECTOR [0.21794334 0.10606424 0.0478828  0.03935448 0.03229864 0.03136558 0.11796494 0.06546174 0.03341064]
MEAN ABSOLUTE ERROR 0.9617008469068318
MEAN SQUARE ERROR: 1.6948874101095208
CORRELATION COEFF: 0.7968621371120339
R2: -6.284048634553031
alpha=0.4
iters=2000 ###iterations
batch_size=15
mb_w_l1, J_mb_l1 = MB_gradient_descent(X_train, y_train, w, alpha, iters, batch_size)
plt.plot(range(iters),J_mb_l1)
plt.xlabel('Iterations')
plt.ylabel('Cost')
plt.title('MBGD Cost vs Iterations')
plt.show()
mbgd=mb_w_l1
print("WEIGHT VECTOR",mbgd)
y_pred_mbgd=X_test.dot(mbgd.T)
yp_unnorm=(y_pred_mbgd*(ymax-ymin))+ymin
y_test_unnorm=(y_test*(ymax-ymin))+ymin
a=mean_abs_error(yp_unnorm,y_test_unnorm)
print("MEAN ABSOLUTE ERROR",a)
b=mean_square_error(yp_unnorm,y_test_unnorm)
print("MEAN SQUARE ERROR:",b)
c=correcoff(yp_unnorm,y_test_unnorm)
print("CORRELATION COEFF:",c)
d=r_squared(y_test_unnorm, yp_unnorm)
print("R2:",d)
plt.figure(figsize=(8, 6))
plt.plot(y_test_unnorm, label='Actual Output', color='blue', marker='o')
plt.plot(yp_unnorm, label='Predicted Output', color='red', marker='x')
plt.xlabel('Sample Index')
plt.ylabel('Output Value')
plt.title('Predicted vs Actual Output')
plt.legend()
plt.show()
WEIGHT VECTOR [0.21794334 0.10606424 0.0478828  0.03935448 0.03229864 0.03136558 0.11796494 0.06546174 0.03341064]
MEAN ABSOLUTE ERROR 1.0860545963179458
MEAN SQUARE ERROR: 1.7247709330182672
CORRELATION COEFF: 0.39688976236696366
R2: -293.6095175999243