0% found this document useful (0 votes)

29 views5 pages

Code

Uploaded by

xahage9739

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

29 views5 pages

Code

Uploaded by

xahage9739

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 5

Assignment 1

Name: SAIKAT MOI

Roll Number: 20CS10050
# import all the necessary libraries here
import pandas as pd
import numpy as np
import random
import matplotlib.pyplot as plt
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split

# Read the regression dataset into a DataFrame and echo it for inspection.
csv_path = '../../dataset/linear-regression.csv'
data = pd.read_csv(csv_path)
print(data)

fixed acidity volatile acidity citric acid residual sugar

chlorides \
0 7.4 0.700 0.00 1.9
0.076
1 7.8 0.880 0.00 2.6
0.098
2 7.8 0.760 0.04 2.3
0.092
3 11.2 0.280 0.56 1.9
0.075
4 7.4 0.700 0.00 1.9
0.076
... ... ... ... ...
...
1594 6.2 0.600 0.08 2.0
0.090
1595 5.9 0.550 0.10 2.2
0.062
1596 6.3 0.510 0.13 2.3
0.076
1597 5.9 0.645 0.12 2.0
0.075
1598 6.0 0.310 0.47 3.6
0.067

free sulfur dioxide total sulfur dioxide density pH

sulphates \
0 11.0 34.0 0.99780 3.51
0.56
1 25.0 67.0 0.99680 3.20
0.68
2 15.0 54.0 0.99700 3.26
0.65
3 17.0 60.0 0.99800 3.16
0.58
4 11.0 34.0 0.99780 3.51
0.56
... ... ... ... ...
...
1594 32.0 44.0 0.99490 3.45
0.58
1595 39.0 51.0 0.99512 3.52
0.76
1596 29.0 40.0 0.99574 3.42
0.75
1597 32.0 44.0 0.99547 3.57
0.71
1598 18.0 42.0 0.99549 3.39
0.66

alcohol quality
0 9.4 5
1 9.8 5
2 9.8 5
3 9.8 6
4 9.4 5
... ... ...
1594 10.5 5
1595 11.2 6
1596 11.0 6
1597 10.2 5
1598 11.0 6

[1599 rows x 12 columns]

# Separate the predictors from the target column.
X = data.drop(columns=['quality'])
y = data['quality']

# Split BEFORE scaling: 50% of the rows go to training; the remaining 50% is
# later divided 60/40 into validation (30% overall) and test (20% overall).
X_train, X_temp, y_train, y_temp = train_test_split(
    X, y, test_size=0.5, random_state=42)

# Feature scaling is a common preprocessing step in machine learning that
# helps improve the performance and convergence of gradient-based training.
# The scaler is fitted on the training rows only, so the mean/variance of the
# validation and test rows cannot leak into preprocessing; the held-out rows
# are transformed with the training statistics.
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train)
X_temp = scaler.transform(X_temp)

# Whole dataset scaled with the training statistics; kept so any later code
# that refers to X_scaled keeps working.
X_scaled = scaler.transform(X)

X_val, X_test, y_val, y_test = train_test_split(
    X_temp, y_temp, test_size=0.4, random_state=42)

def _print_split_shapes(header, features, targets):
    """Print `header` followed by the shapes of one split's features and targets."""
    print(header, features.shape, "y:", targets.shape)


# Report the size of each of the three splits.
_print_split_shapes("Train set shapes - X:", X_train, y_train)
_print_split_shapes("Validation set shapes - X:", X_val, y_val)
_print_split_shapes("Test set shapes - X:", X_test, y_test)
Train set shapes - X: (799, 11) y: (799,)
Validation set shapes - X: (480, 11) y: (480,)
Test set shapes - X: (320, 11) y: (320,)

# Concatenate a column vector of ones with the X_train matrix, effectively
# adding a new first column to X_train.
# The bias term allows the model to learn an offset from the origin.
X_train_with_bias = np.c_[np.ones((X_train.shape[0], 1)), X_train]

# Normal Equation: θ = (X^T X)^(-1) X^T y
# The linear system (X^T X) θ = X^T y is solved directly rather than forming
# the explicit inverse, which is cheaper and numerically better conditioned.
# The target is converted to a plain float array so the matrix products do
# not go through pandas operator dispatch.
theta = np.linalg.solve(
    X_train_with_bias.T @ X_train_with_bias,
    X_train_with_bias.T @ np.asarray(y_train, dtype=float),
)

# Predict on the test set: prepend the bias column, then apply the fitted weights.
test_ones = np.ones((X_test.shape[0], 1))
X_test_with_bias = np.hstack((test_ones, X_test))
y_test_pred = X_test_with_bias @ theta

# Residuals are shared by both metrics below.
residuals = y_test - y_test_pred

# R-squared on the test set: 1 - (residual sum of squares / total sum of squares)
ssr = np.sum(residuals ** 2)
sst = np.sum((y_test - np.mean(y_test)) ** 2)
r2 = 1 - (ssr / sst)

# RMSE on the test set: sqrt((1 / n) * Σ(y_pred - y_actual)^2)
rmse = np.sqrt(np.mean(residuals ** 2))

print("Test Set - R-squared:", r2)
print("Test Set - Root Mean Squared Error (RMSE):", rmse)

Test Set - R-squared: 0.3967805084557149

Test Set - Root Mean Squared Error (RMSE): 0.6657115962476505

def compute_loss(X, y, theta):
    """Return the mean squared error between predictions and targets.

    Args:
        X: Design matrix; each row is one sample (callers in this file pass
            a matrix whose first column is the bias column of ones).
        y: Actual target values, one per row of ``X``.
        theta: Weight vector applied as ``X @ theta``.

    Returns:
        The mean of the squared differences between ``X @ theta`` and ``y``.
    """
    y_pred = X @ theta
    loss = np.mean((y_pred - y) ** 2)
    return loss

# ∇(MSE) = -2 * (X^T @ (y - Xθ)) / N

def gradient_ascent(X, y, theta, learning_rate, num_iterations):
    """Fit linear-regression weights by batch gradient descent on the MSE.

    Despite its name, this routine moves *against* the gradient (it subtracts
    ``learning_rate * gradient``), i.e. it minimises the loss. The name is
    kept unchanged so existing callers keep working.

    Args:
        X: Design matrix; each row is one sample.
        y: Target values, one per row of ``X``.
        theta: Initial weight vector. It is copied, so the caller's array is
            left untouched.
        learning_rate: Step size applied to the gradient on every iteration.
        num_iterations: Number of full-batch update steps to perform.

    Returns:
        A tuple ``(theta, losses)``: the weights after the final step, and a
        list holding the MSE loss recorded after each update.
    """
    # Work on a float copy: an in-place update would otherwise overwrite the
    # caller's initial vector, and would fail for an integer-typed array.
    theta = np.array(theta, dtype=float)
    n_samples = len(y)

    losses = []
    for _ in range(num_iterations):
        y_pred = X @ theta
        # Gradient of the MSE with respect to theta: -2 * X^T (y - Xθ) / N
        gradient = -2 * (X.T @ (y - y_pred)) / n_samples
        theta -= learning_rate * gradient
        # The loss is recorded after the update, using the new weights.
        losses.append(compute_loss(X, y, theta))
    return theta, losses

# Learning rates to compare, and the number of update steps used for each.
learning_rates = [0.01, 0.001, 0.0001]
num_iterations = 50000

# These do not depend on the learning rate, so they are built once instead of
# on every pass through the loop.
X_train_with_bias = np.c_[np.ones((X_train.shape[0], 1)), X_train]
X_test_with_bias = np.c_[np.ones((X_test.shape[0], 1)), X_test]
sst = np.sum((y_test - np.mean(y_test)) ** 2)

# NOTE(review): in the visible code the validation split is only printed and
# the learning rates are compared on the test set; consider comparing them on
# X_val / y_val instead and reserving the test set for the final report.
for lr in learning_rates:
    # Start every run from all-zero weights (+1 entry for the bias term).
    theta_initial = np.zeros(X_train.shape[1] + 1)
    theta_optimized, losses = gradient_ascent(
        X_train_with_bias, y_train, theta_initial, lr, num_iterations)

    # One loss curve per learning rate, all drawn on the same axes.
    plt.plot(range(num_iterations), losses, label=f'lr = {lr}')

    y_test_pred = X_test_with_bias @ theta_optimized

    # Calculate R-squared on the test set
    ssr = np.sum((y_test - y_test_pred) ** 2)
    r2 = 1 - (ssr / sst)

    # Calculate RMSE on the test set
    rmse = np.sqrt(np.mean((y_test - y_test_pred) ** 2))

    print(f"Learning Rate: {lr}")
    print("Test Set - R-squared:", r2)
    print("Test Set - Root Mean Squared Error (RMSE):", rmse)
    print()

# Label and show the combined figure once all curves have been added.
plt.xlabel('Iteration')
plt.ylabel('Loss')
plt.title('Loss Function vs. Iteration for Different Learning Rates')
plt.legend()
plt.show()

Learning Rate: 0.01

Test Set - R-squared: 0.3967805084557158
Test Set - Root Mean Squared Error (RMSE): 0.6657115962476501

Learning Rate: 0.001

Test Set - R-squared: 0.3967803979339991
Test Set - Root Mean Squared Error (RMSE): 0.6657116572333991

Learning Rate: 0.0001

Test Set - R-squared: 0.39639733535434873
Test Set - Root Mean Squared Error (RMSE): 0.6659229971434986

ML LAB 12 - Jupyter Notebook
No ratings yet
ML LAB 12 - Jupyter Notebook
11 pages
Wine Quality Prediction
No ratings yet
Wine Quality Prediction
6 pages
Logistic Regression Wine Analysis
No ratings yet
Logistic Regression Wine Analysis
3 pages
Karisma 23011101119 Eda Rec
No ratings yet
Karisma 23011101119 Eda Rec
88 pages
Quality Prediction
No ratings yet
Quality Prediction
20 pages
ML Program 7, 8,9 And10
No ratings yet
ML Program 7, 8,9 And10
12 pages
Practical04.ipynb - Colab
No ratings yet
Practical04.ipynb - Colab
2 pages
Stratified K-Fold in Scikit-Learn
No ratings yet
Stratified K-Fold in Scikit-Learn
6 pages
Assignment4 VidulGarg
No ratings yet
Assignment4 VidulGarg
14 pages
Regresi A
No ratings yet
Regresi A
11 pages
Ams 427 Statistical Model Building
No ratings yet
Ams 427 Statistical Model Building
5 pages
Random Forest
No ratings yet
Random Forest
5 pages
EXP - 7 - Prasham Doshi - 22bec097
No ratings yet
EXP - 7 - Prasham Doshi - 22bec097
7 pages
Data Mining Lab Manual
No ratings yet
Data Mining Lab Manual
7 pages
4.4. Data Standardization - Ipynb - Colaboratory
No ratings yet
4.4. Data Standardization - Ipynb - Colaboratory
1 page
Submission of Term Work': Subject - Cpms
No ratings yet
Submission of Term Work': Subject - Cpms
25 pages
Data Mining 1 Practical File-1
No ratings yet
Data Mining 1 Practical File-1
24 pages
Tables Perf
No ratings yet
Tables Perf
3 pages
Labpg3.ipynb - Colab
No ratings yet
Labpg3.ipynb - Colab
2 pages
Logistic Regression for Red Wine Quality
100% (1)
Logistic Regression for Red Wine Quality
10 pages
KNN - Jupyter Notebook
No ratings yet
KNN - Jupyter Notebook
7 pages
Scikit-Learn for Data Scientists
No ratings yet
Scikit-Learn for Data Scientists
32 pages
Quality Prediction Checkpoint
No ratings yet
Quality Prediction Checkpoint
14 pages
DATA SCIENCE IDC 302 End Sem Project
No ratings yet
DATA SCIENCE IDC 302 End Sem Project
1 page
Standard Normal Distribution Table
No ratings yet
Standard Normal Distribution Table
3 pages
Silicon Parameter File
No ratings yet
Silicon Parameter File
49 pages
ML FINAL Lab Manual
No ratings yet
ML FINAL Lab Manual
7 pages
Week 4 Naive Bayes Classifier
No ratings yet
Week 4 Naive Bayes Classifier
2 pages
IEEE 30-Bus Test System Analysis
No ratings yet
IEEE 30-Bus Test System Analysis
6 pages
Anexo Estadístico Tabla de Distribución Normal: Escuela de Ingeniería Industrial
No ratings yet
Anexo Estadístico Tabla de Distribución Normal: Escuela de Ingeniería Industrial
2 pages
Tablas Estadisticas PDF
No ratings yet
Tablas Estadisticas PDF
2 pages
Normal Distribution Table
No ratings yet
Normal Distribution Table
2 pages
Como PDF
No ratings yet
Como PDF
2 pages
Tabla de Distribución Normal Z
No ratings yet
Tabla de Distribución Normal Z
2 pages
Memoriza Estadisticas PDF
No ratings yet
Memoriza Estadisticas PDF
2 pages
Normal Distribution Table
No ratings yet
Normal Distribution Table
2 pages
Intento PDF
No ratings yet
Intento PDF
2 pages
Hola PDF
No ratings yet
Hola PDF
2 pages
Linear Regression for Beginners
No ratings yet
Linear Regression for Beginners
6 pages
%trabajamos Con Los Componentes Metanol y 1-Hepteno %componente Metanol
No ratings yet
%trabajamos Con Los Componentes Metanol y 1-Hepteno %componente Metanol
3 pages
Appendix
No ratings yet
Appendix
12 pages
Project 3 - Diabetes Prediction - Ipynb - Colab
No ratings yet
Project 3 - Diabetes Prediction - Ipynb - Colab
4 pages
Criterio de Ross: Datos E.C. NV MULA: FD (1 - (E/VUT) 1.4) F E.C. R E.C.RE E.C.Rep E.C.D
No ratings yet
Criterio de Ross: Datos E.C. NV MULA: FD (1 - (E/VUT) 1.4) F E.C. R E.C.RE E.C.Rep E.C.D
6 pages
Assignment 03
No ratings yet
Assignment 03
6 pages
Regression Statistics
No ratings yet
Regression Statistics
17 pages
T Student
No ratings yet
T Student
2 pages
Full Z Score Table
No ratings yet
Full Z Score Table
2 pages
Neural Network Regression for Alloy Data
No ratings yet
Neural Network Regression for Alloy Data
38 pages
Tabla Poisson 022021 Final
No ratings yet
Tabla Poisson 022021 Final
5 pages
Model Training
No ratings yet
Model Training
6 pages
Lab3 (Main) .Ipynb - Colab
No ratings yet
Lab3 (Main) .Ipynb - Colab
1 page
Model Evaluation and Hyperparameter Tuning
No ratings yet
Model Evaluation and Hyperparameter Tuning
11 pages
F Error
No ratings yet
F Error
27 pages
MNIST Digit Recognition Guide
No ratings yet
MNIST Digit Recognition Guide
8 pages
Classeur 1
No ratings yet
Classeur 1
21 pages
Machine Learning - Lab Record
No ratings yet
Machine Learning - Lab Record
43 pages
PDF 08 0247
No ratings yet
PDF 08 0247
2 pages
Tabele pentru Calcularea Entropiilor
No ratings yet
Tabele pentru Calcularea Entropiilor
8 pages
Haz Plot Fail Modes For Moodle
No ratings yet
Haz Plot Fail Modes For Moodle
16 pages
Shelf Life Estimation
No ratings yet
Shelf Life Estimation
35 pages
Forensic Facial Reconstruction Guide
100% (4)
Forensic Facial Reconstruction Guide
39 pages
Overview Management and Exploitation of Fishery Resources of Cameroon PDF
No ratings yet
Overview Management and Exploitation of Fishery Resources of Cameroon PDF
70 pages
BIBO Stability in Digital Control Systems
No ratings yet
BIBO Stability in Digital Control Systems
51 pages
Grade 1 Term 1 Maths Plan
No ratings yet
Grade 1 Term 1 Maths Plan
15 pages
X - Vibrate Air To A Measured Timing and You Have The - Paranormal - 4chan
No ratings yet
X - Vibrate Air To A Measured Timing and You Have The - Paranormal - 4chan
3 pages
Spivak's Postcolonial Criticism
0% (1)
Spivak's Postcolonial Criticism
5 pages
Measuring Personal-Group Relations
No ratings yet
Measuring Personal-Group Relations
7 pages
Political
No ratings yet
Political
194 pages
Non Violent Communication
100% (5)
Non Violent Communication
20 pages
Sterilization Biological Indicators
No ratings yet
Sterilization Biological Indicators
4 pages
My Limitations
No ratings yet
My Limitations
83 pages
Black and White End of The Year Super Student Certificates
No ratings yet
Black and White End of The Year Super Student Certificates
14 pages
Ashtar - God, Man, or Machine
No ratings yet
Ashtar - God, Man, or Machine
4 pages
Paper Strip Game
No ratings yet
Paper Strip Game
6 pages
First Division: THE PEOPLE OF THE PHILIPPINES, Plaintiff-Appellee, vs. BRIAN MERCADO y SARMIENTO, Accused-Appellant
No ratings yet
First Division: THE PEOPLE OF THE PHILIPPINES, Plaintiff-Appellee, vs. BRIAN MERCADO y SARMIENTO, Accused-Appellant
10 pages
Final Project Report PDF
No ratings yet
Final Project Report PDF
35 pages
EIA For Maize & Wheat Milling Plant DEI PDF
100% (3)
EIA For Maize & Wheat Milling Plant DEI PDF
110 pages
PLSQL Study Material
No ratings yet
PLSQL Study Material
13 pages
Revitalizing Albania's Industrial Heritage
No ratings yet
Revitalizing Albania's Industrial Heritage
16 pages
Group Dynamics and Development Stages
No ratings yet
Group Dynamics and Development Stages
18 pages
Leverage Leadership: A Book Review
No ratings yet
Leverage Leadership: A Book Review
8 pages
African Philosophy of Education
0% (1)
African Philosophy of Education
6 pages
On Sequential Analysis
0% (1)
On Sequential Analysis
9 pages
Introduction To Power System Reliability Evaluation: Availability (AV) and Forced Outage Rate (FOR)
No ratings yet
Introduction To Power System Reliability Evaluation: Availability (AV) and Forced Outage Rate (FOR)
9 pages
Fusion Gdms
No ratings yet
Fusion Gdms
14 pages
MBA HR Case Study Analysis
No ratings yet
MBA HR Case Study Analysis
16 pages
LeNS Proceedings
No ratings yet
LeNS Proceedings
899 pages
English Vocabulary for Students
No ratings yet
English Vocabulary for Students
17 pages
Calibration Procedure for Air Gauges
100% (1)
Calibration Procedure for Air Gauges
3 pages