Name - Ankit Kumar
Roll - BTECH/10066/22
LAB-5
Program1:
import csv
import numpy as np
import matplotlib.pyplot as plt
# Load the data
data = []
with open('Salary_data.csv', 'r') as file:
    reader = csv.reader(file)
    next(reader)  # Skip header row
    for row in reader:
        data.append([float(row[0]), float(row[1])])
# Separate the data into Experience (X) and Salary (Y)
X = np.array([row[0] for row in data])
Y = np.array([row[1] for row in data])
# Plot Experience vs. Salary
plt.scatter(X, Y, color='blue')
plt.xlabel('Experience (years)')
plt.ylabel('Salary')
plt.title('Experience vs. Salary')
plt.show()
# Initialize parameters
m = 0 # Slope
b = 0 # Intercept
learning_rate = 0.01
iterations = 1000
n = len(X)
# Function to compute Mean Squared Error
def compute_mse(X, Y, m, b):
    total_error = 0
    for i in range(len(X)):
        total_error += (Y[i] - (m * X[i] + b)) ** 2
    return total_error / len(X)  # Use len(X) instead of relying on the global n
# Gradient Descent
errors = []
for _ in range(iterations):
    m_grad = 0
    b_grad = 0
    for i in range(len(X)):
        m_grad += -2 * X[i] * (Y[i] - (m * X[i] + b))
        b_grad += -2 * (Y[i] - (m * X[i] + b))
    m -= (m_grad / n) * learning_rate
    b -= (b_grad / n) * learning_rate
    mse = compute_mse(X, Y, m, b)
    errors.append(mse)
print(f"Final Parameters: m = {m}, b = {b}")
# Plot Training Error at Each Iteration
plt.plot(range(iterations), errors, color='red')
plt.xlabel('Iteration')
plt.ylabel('Mean Squared Error')
plt.title('Training Error at Each Iteration')
plt.show()
# Plot Experience vs. Salary with Best Fit Line
plt.scatter(X, Y, color='blue')
plt.plot(X, [m * x + b for x in X], color='red') # Best fit line
plt.xlabel('Experience (years)')
plt.ylabel('Salary')
plt.title('Experience vs. Salary with Best Fit Line')
plt.show()
OUTPUT:
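Note (sanity check, not part of the submitted program): the slope and intercept found by gradient descent can be compared against the closed-form least-squares line. np.polyfit(X, Y, 1) minimizes the same mean squared error, so m and b from the loop above should approach these values as the number of iterations grows.

# Closed-form least-squares fit for comparison (degree-1 polynomial)
m_ls, b_ls = np.polyfit(X, Y, 1)
print(f"Closed-form least squares: m = {m_ls}, b = {b_ls}")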
Program2:
import pandas as pd
from sklearn.preprocessing import MinMaxScaler
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error
# Load the dataset
data = pd.read_csv('insurance.csv')
# Display the top 10 samples of the dataset
print(data.head(10))
# Display the features and label
features = data.columns[:-1]
label = data.columns[-1]
print("Features (Independent Variables):", features.tolist())
print("Label (Dependent Variable):", label)
# Remove missing value samples
data = data.dropna()
print("Number of samples after removing missing values:", len(data))
# Convert categorical variables to numeric using one-hot encoding
data = pd.get_dummies(data, columns=['sex', 'smoker', 'region'], drop_first=True)
# Update the features to reflect the one-hot encoded columns. After
# get_dummies the label is no longer the last column of the frame, so
# select the features by dropping the label column by name rather than
# slicing off the final column.
features = data.columns.drop(label)
# Normalize the feature set
scaler = MinMaxScaler()
data[features] = scaler.fit_transform(data[features])
print("Normalized feature set:")
print(data.head(10))
# Split the data into training and testing sets
X = data[features]
y = data[label]
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
print("Number of training samples:", len(X_train))
print("Number of testing samples:", len(X_test))
# Train the regression model
model = LinearRegression()
model.fit(X_train, y_train)
print("Model coefficients:", model.coef_)
print("Model intercept:", model.intercept_)
# Predict the test data
y_pred = model.predict(X_test)
# Calculate and display the testing error (Mean Squared Error)
mse = mean_squared_error(y_test, y_pred)
print("Testing Error (Mean Squared Error):", mse)
OUTPUT:
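Note (optional follow-up, not part of the submitted program): the MSE is in squared units of the label, so the root mean squared error and the R^2 score are often easier to interpret. A minimal sketch, reusing mse, y_test, and y_pred from above:

from sklearn.metrics import r2_score
rmse = mse ** 0.5  # Error in the same units as the label
r2 = r2_score(y_test, y_pred)  # Fraction of label variance explained
print("Testing RMSE:", rmse)
print("R^2 score:", r2)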
Program3:
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder
from sklearn.metrics import accuracy_score
# Load the Iris dataset from the local CSV file
data = pd.read_csv('iris.csv')
# Display the top 10 samples of the dataset
print(data.head(10))
# Check the column names to identify the target variable
print("Column names:", data.columns)
# The target variable column name is 'Species'
target_variable = 'Species'
# Encode the class labels into numeric values
label_encoder = LabelEncoder()
data[target_variable] = label_encoder.fit_transform(data[target_variable])
# Split the data into features (X) and labels (y)
X = data.iloc[:, 1:-1] # Exclude the 'Id' column and the target variable column
y = data.iloc[:, -1]
# Split the data into training and testing sets (80% training, 20% testing)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
# Logistic Regression implementation
class LogisticRegression:
    def __init__(self, learning_rate=0.01, iterations=1000):
        self.learning_rate = learning_rate
        self.iterations = iterations

    def sigmoid(self, z):
        return 1 / (1 + np.exp(-z))

    def fit(self, X, y):
        self.m, self.n = X.shape
        self.weights = np.zeros(self.n)
        self.bias = 0
        self.errors = []
        epsilon = 1e-7  # Small epsilon value to avoid log(0)
        for _ in range(self.iterations):
            linear_model = np.dot(X, self.weights) + self.bias
            y_pred = self.sigmoid(linear_model)
            dw = (1 / self.m) * np.dot(X.T, (y_pred - y))
            db = (1 / self.m) * np.sum(y_pred - y)
            self.weights -= self.learning_rate * dw
            self.bias -= self.learning_rate * db
            loss = -(1 / self.m) * np.sum(y * np.log(y_pred + epsilon) + (1 - y) * np.log(1 - y_pred + epsilon))
            self.errors.append(loss)

    def predict(self, X):
        # Binary decision rule: this model separates only two classes, so
        # accuracy on the three encoded Iris labels (0, 1, 2) is limited.
        linear_model = np.dot(X, self.weights) + self.bias
        y_pred = self.sigmoid(linear_model)
        return [1 if i > 0.5 else 0 for i in y_pred]
# Train the logistic regression model
log_reg = LogisticRegression(learning_rate=0.01, iterations=1000)
log_reg.fit(X_train, y_train)
print("Model weights:", log_reg.weights)
print("Model bias:", log_reg.bias)
# Predict the test data
y_pred = log_reg.predict(X_test)
# Calculate and display the accuracy
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
OUTPUT:
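Note (optional cross-check, not part of the submitted program): the scratch model above is binary, while the Iris labels have three classes, so its accuracy is inherently limited. scikit-learn's LogisticRegression handles all three classes out of the box and gives a useful reference accuracy. A minimal sketch, reusing the train/test split from above:

from sklearn.linear_model import LogisticRegression as SkLogisticRegression
sk_model = SkLogisticRegression(max_iter=1000)  # Multiclass handled by default
sk_model.fit(X_train, y_train)
print("scikit-learn accuracy:", sk_model.score(X_test, y_test))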