Ailab 2

The document contains multiple sections demonstrating machine learning techniques in Python: logistic regression for diabetes prediction, a backpropagation neural network trained on XOR, Naive Bayes for spam classification, K-Means clustering on the Iris dataset, and a decision tree for species classification. Each section includes data preprocessing, model training, evaluation metrics, and visualizations such as confusion matrices and scatter plots, illustrating practical applications of machine learning algorithms on real datasets.

import pandas as pd

# Load the diabetes dataset and separate the features from the target
record = pd.read_csv("/content/diabetes.csv")
x = record.drop('Outcome', axis=1)
y = record['Outcome']

# Split into 75% train / 25% test
from sklearn.model_selection import train_test_split
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.25, random_state=16)

# Train a logistic regression classifier
from sklearn.linear_model import LogisticRegression
logreg = LogisticRegression(random_state=16, max_iter=1000)
logreg.fit(x_train, y_train)
y_pred = logreg.predict(x_test)

# Confusion matrix on the test set
from sklearn import metrics
cnf_matrix = metrics.confusion_matrix(y_test, y_pred)
cnf_matrix
# Repeat the pipeline in a single cell and visualize the confusion matrix
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn import metrics
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import train_test_split
import pandas as pd

# Load data
record = pd.read_csv("/content/diabetes.csv")

# Prepare data
x = record.drop('Outcome', axis=1)
y = record['Outcome']
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.25, random_state=16)

# Train model
logreg = LogisticRegression(random_state=16, max_iter=1000)
logreg.fit(x_train, y_train)
y_pred = logreg.predict(x_test)

# Calculate the confusion matrix
cnf_matrix = metrics.confusion_matrix(y_test, y_pred)

# Plot the confusion matrix as a heatmap with the test accuracy in the title
plt.figure(figsize=(9, 9))
sns.heatmap(cnf_matrix, annot=True, fmt=".0f", linewidths=.5, square=True, cmap='Blues_r')
plt.ylabel('Actual label')
plt.xlabel('Predicted label')
all_sample_title = 'Accuracy Score: {0}'.format(logreg.score(x_test, y_test))
plt.title(all_sample_title, size=15)
plt.show()
Output:

array([[116,   9],
       [ 25,  42]])
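For a fuller picture of per-class performance, here is a minimal follow-up sketch, assuming y_test and y_pred from the cell above are still in scope (the class names 'No Diabetes'/'Diabetes' are labels added here for readability, not from the original dataset):

from sklearn.metrics import classification_report

# Per-class precision, recall, and F1 on the diabetes test split
print(classification_report(y_test, y_pred, target_names=['No Diabetes', 'Diabetes']))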
import numpy as np

# Activation function
def sigmoid(x):
    return 1 / (1 + np.exp(-x))

# XOR inputs (the first column is a constant bias input) and targets
X = np.array([[1, 0, 0], [1, 0, 1], [1, 1, 0], [1, 1, 1]])
Tj = np.array([[0], [1], [1], [0]])

# Initial random weights
np.random.seed(42)
W1 = np.random.randn(3, 4)
W2 = np.random.randn(4, 1)
lr = 0.1
epochs = 10000

for epoch in range(epochs):
    Ij_hidden = np.dot(X, W1)          # net input of hidden layer
    Oj_hidden = sigmoid(Ij_hidden)     # output of hidden layer

    Ij_output = np.dot(Oj_hidden, W2)  # net input of output layer
    Oj_output = sigmoid(Ij_output)     # final output (y_pred)

    # Error at output layer (delta rule with the sigmoid derivative O*(1-O))
    Err_output = Oj_output * (1 - Oj_output) * (Tj - Oj_output)

    # Error at hidden layer, backpropagated through W2
    Err_hidden = Oj_hidden * (1 - Oj_hidden) * np.dot(Err_output, W2.T)

    # Update weights
    W2 += lr * np.dot(Oj_hidden.T, Err_output)
    W1 += lr * np.dot(X.T, Err_hidden)

    # Print error occasionally
    if epoch % 2000 == 0:
        E = 0.5 * np.sum((Tj - Oj_output) ** 2)
        print(f"Epoch:{epoch},Error:{E:.4f}")

print("Predicted output")
print(Oj_output)
Output:

Epoch:0,Error:0.8641
Epoch:2000,Error:0.2243
Epoch:4000,Error:0.0213
Epoch:6000,Error:0.0089
Epoch:8000,Error:0.0055
Predicted output
[[0.02646161]
 [0.95237071]
 [0.95594195]
 [0.05369205]]
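To read the network's outputs as class labels, a minimal sketch (assuming Oj_output from the training loop above) that thresholds the sigmoid activations at 0.5:

# Threshold the continuous outputs to recover binary XOR predictions
predictions = (Oj_output > 0.5).astype(int)
print(predictions)  # matches the targets Tj: [[0], [1], [1], [0]]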
import numpy as np
import pandas as pd

data=pd.read_csv("spam.csv")
data.head(5)
data['Category'] = data['Category'].map({'spam': 1, 'ham': 0})
#checks for null values and prints its count
print(data.isnull().sum())
#drops NaN values
data.dropna(inplace=True)
#get count of duplicate values
print(data.duplicated().sum())
data.drop_duplicates(inplace=True)
from sklearn.feature_extraction.text import CountVectorizer
vectorizer = CountVectorizer()
X = vectorizer.fit_transform(data['Message'])
from sklearn.model_selection import train_test_split
y = data['Category']
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42, stratify=y)
from sklearn.naive_bayes import MultinomialNB
from sklearn.metrics import accuracy_score
nb_model = MultinomialNB(alpha=1.0)
nb_model.fit(X_train, y_train)
y_pred = nb_model.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)

from sklearn.metrics import confusion_matrix
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
cm = confusion_matrix(y_test, y_pred)
cm_df = pd.DataFrame(cm, index=['Actual Ham (0)', 'Actual Spam (1)'],
columns=['Predicted Ham (0)', 'Predicted Spam (1)'])
print("Confusion Matrix:\n", cm_df)
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score
accuracy = accuracy_score(y_test, y_pred)
precision = precision_score(y_test, y_pred)
recall = recall_score(y_test, y_pred)
f1 = f1_score(y_test, y_pred)

print(f"\nAccuracy: {accuracy:.4f}")
print(f"Precision: {precision:.4f}")
print(f"Recall: {recall:.4f}")
print(f"F1-Score: {f1:.4f}")

plt.figure(figsize=(6, 5))
sns.heatmap(cm_df, annot=True, fmt='d', cmap='Blues', cbar=False)
plt.title('Confusion Matrix')
plt.ylabel('Actual Label')
plt.xlabel('Predicted Label')
plt.show()

Output:

  Category                                            Message
0      ham  Go until jurong point, crazy.. Available only ...
1      ham                      Ok lar... Joking wif u oni...
2     spam  Free entry in 2 a wkly comp to win FA Cup fina...
3      ham  U dun say so early hor... U c already then say...
4      ham  Nah I don't think he goes to usf, he lives aro...

Category    0
Message     0
dtype: int64

415
Accuracy: 0.9728682170542635

Confusion Matrix:
                  Predicted Ham (0)  Predicted Spam (1)
Actual Ham (0)                  887                  17
Actual Spam (1)                  11                 117

Accuracy: 0.9729
Precision: 0.8731
Recall: 0.9141
F1-Score: 0.8931
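As a quick sanity check, a minimal sketch (assuming vectorizer and nb_model from above; the two sample messages are made up for illustration) that classifies unseen text:

samples = ["Congratulations! You have won a free prize, call now",
           "Are we still meeting for lunch tomorrow?"]
sample_vec = vectorizer.transform(samples)
print(nb_model.predict(sample_vec))  # 1 = spam, 0 = ham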
import pandas as pd

df = pd.read_csv("Iris.csv")
df.head()

# Drop the target column; note that the Id column is kept among the features here
X = df.drop('Species', axis=1)
X.head()

from sklearn.cluster import KMeans

# Apply K-Means clustering with n_clusters = 3
kmeans = KMeans(n_clusters=3, random_state=42, n_init=10)
kmeans.fit(X)
labels = kmeans.labels_  # Get the cluster labels

# Attach the cluster labels to the dataframe
df['Cluster'] = labels
df.head()
import matplotlib.pyplot as plt

plt.figure(figsize=(8, 6))
scatter = plt.scatter(df['PetalLengthCm'], df['PetalWidthCm'], c=df['Cluster'],
                      cmap='viridis', marker='o')
plt.title('K-Means Clustering on Iris Dataset (Petal Length vs Petal Width)')
plt.xlabel('PetalLengthCm')
plt.ylabel('PetalWidthCm')
plt.colorbar(label='Cluster')
plt.grid(True)

# Build a legend with one proxy point per cluster
legend_elements = [plt.scatter([], [], marker='o', color=scatter.to_rgba(label),
                               label=f'Cluster {label}')
                   for label in sorted(df['Cluster'].unique())]
plt.legend(handles=legend_elements, title='Clusters')

plt.show()
cross_tab = pd.crosstab(df['Species'], df['Cluster'])
display(cross_tab)
Output:

   Id  SepalLengthCm  SepalWidthCm  PetalLengthCm  PetalWidthCm      Species
0   1            5.1           3.5            1.4           0.2  Iris-setosa
1   2            4.9           3.0            1.4           0.2  Iris-setosa
2   3            4.7           3.2            1.3           0.2  Iris-setosa
3   4            4.6           3.1            1.5           0.2  Iris-setosa
4   5            5.0           3.6            1.4           0.2  Iris-setosa

   Id  SepalLengthCm  SepalWidthCm  PetalLengthCm  PetalWidthCm
0   1            5.1           3.5            1.4           0.2
1   2            4.9           3.0            1.4           0.2
2   3            4.7           3.2            1.3           0.2
3   4            4.6           3.1            1.5           0.2
4   5            5.0           3.6            1.4           0.2

   Id  SepalLengthCm  SepalWidthCm  PetalLengthCm  PetalWidthCm      Species  Cluster
0   1            5.1           3.5            1.4           0.2  Iris-setosa        2
1   2            4.9           3.0            1.4           0.2  Iris-setosa        2
2   3            4.7           3.2            1.3           0.2  Iris-setosa        2
3   4            4.6           3.1            1.5           0.2  Iris-setosa        2
4   5            5.0           3.6            1.4           0.2  Iris-setosa        2

Cluster           0   1   2
Species
Iris-setosa       1   0  49
Iris-versicolor  49   1   0
Iris-virginica    0  50   0
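To put a single number on how well the clusters track the species, a minimal sketch (assuming df with its Species and Cluster columns from above) using scikit-learn's adjusted Rand index:

from sklearn.metrics import adjusted_rand_score

# 1.0 = clusters match the species labels perfectly, ~0.0 = random assignment
ari = adjusted_rand_score(df['Species'], df['Cluster'])
print(f"Adjusted Rand Index: {ari:.4f}")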
import pandas as pd

df = pd.read_csv('/content/species_dataset.csv')
df.head()

from sklearn.tree import DecisionTreeClassifier, plot_tree
from sklearn.preprocessing import OneHotEncoder
import matplotlib.pyplot as plt

# One-hot encode the categorical features
X = df.drop('species', axis=1)
y = df['species']
encoder = OneHotEncoder(handle_unknown='ignore', sparse_output=False)
X_encoded = encoder.fit_transform(X)
feature_names = encoder.get_feature_names_out(X.columns)

# Train an entropy-based (ID3-like) decision tree and plot it
model = DecisionTreeClassifier(criterion='entropy', random_state=42)
model.fit(X_encoded, y)

plt.figure(figsize=(15, 10))
plot_tree(model,
          feature_names=feature_names,
          class_names=model.classes_,
          filled=True,
          rounded=True,
          proportion=True,
          fontsize=10)
plt.title("Decision Tree (ID3-like) for Species Classification")
plt.show()
Output:

       Toothed      Hair  Breathes      Legs  species
0      Toothed      Hair  Breathes      Legs   Mammal
1      Toothed      Hair  Breathes      Legs   Mammal
2      Toothed      Hair  Breathes      Legs   Mammal
3      Toothed  Not Hair  Breathes  Not Legs  Reptile
4  Not Toothed      Hair  Breathes      Legs   Mammal
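Finally, a minimal sketch (assuming model, encoder, and X from above; the sample animal is hypothetical) that classifies a new row through the same one-hot encoding:

# Hypothetical animal: toothed, no hair, breathes, has legs
new_animal = pd.DataFrame([['Toothed', 'Not Hair', 'Breathes', 'Legs']],
                          columns=X.columns)
print(model.predict(encoder.transform(new_animal)))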
