0% found this document useful (0 votes)

13 views · 6 pages

Python KNN

The document provides Python code for implementing the K-Nearest Neighbors (KNN) algorithm, including functions for loading data, converting data types, normalizing datasets, calculating Euclidean distance, and making predictions. It specifically demonstrates how to predict the class of a new record using the Iris dataset. The code includes detailed steps for data preprocessing and neighbor identification to facilitate classification.

Uploaded by

bachanpriya20

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

13 views · 6 pages

Python KNN

Uploaded by

bachanpriya20

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 6

KNN: Python Code

-Priya R. Bachan, Rishika

Code

from csv import reader

from math import sqrt

# Load a CSV file

def load_csv(filename):
    """Read a CSV file into a list of rows, skipping empty rows.

    Args:
        filename: Path of the CSV file to read.

    Returns:
        A list containing one list of string fields per non-empty row.
    """
    # newline='' hands newline handling to the csv module, so line breaks
    # embedded inside quoted fields are preserved instead of being translated.
    with open(filename, 'r', newline='') as file:
        return [row for row in reader(file) if row]

# Convert string column to float

def str_column_to_float(dataset, column):
    """Replace the string at index `column` of every row with its float value.

    Surrounding whitespace is stripped before conversion. Rows are modified
    in place; nothing is returned.
    """
    for record in dataset:
        text = record[column]
        record[column] = float(text.strip())

# Convert string column to integer

def str_column_to_int(dataset, column):
    """Encode the values in one column as integer codes, in place.

    Codes are assigned in order of first appearance in the dataset, so the
    mapping is reproducible from run to run (iterating a set of strings is
    not, because string hashing is randomized per process).

    Args:
        dataset: List of rows (lists); modified in place.
        column: Index of the column to encode.

    Returns:
        The dict mapping each original value to its integer code.
    """
    lookup = dict()
    for row in dataset:
        value = row[column]
        if value not in lookup:
            lookup[value] = len(lookup)
            print('[%s] => %d' % (value, lookup[value]))
    # Second pass: only rewrite the rows once the mapping is complete.
    for row in dataset:
        row[column] = lookup[row[column]]
    return lookup

# Find the min and max values for each column

def dataset_minmax(dataset):
    """Return [min, max] for every column of the dataset.

    The number of columns is taken from the first row. The result is a list
    with one two-element list per column, in column order.
    """
    width = len(dataset[0])
    columns = ([record[idx] for record in dataset] for idx in range(width))
    return [[min(values), max(values)] for values in columns]

# Rescale dataset columns to the range 0-1

def normalize_dataset(dataset, minmax):
    """Rescale every column of the dataset to the range 0-1, in place.

    Args:
        dataset: List of rows of numbers; modified in place.
        minmax: One [min, max] pair per column, as produced by
            dataset_minmax.

    A column whose min and max are equal carries no information and would
    divide by zero; its values are set to 0.0 instead.
    """
    for row in dataset:
        for i, value in enumerate(row):
            low = minmax[i][0]
            span = minmax[i][1] - low
            row[i] = (value - low) / span if span else 0.0

# Calculate the Euclidean distance between two vectors

def euclidean_distance(row1, row2):
    """Return the Euclidean distance between two rows.

    The last element of row1 is excluded from the calculation (rows carry
    their class label in the final position), so only indices
    0 .. len(row1) - 2 of both rows are compared.
    """
    feature_count = len(row1) - 1
    squared_sum = sum(
        ((row1[idx] - row2[idx]) ** 2 for idx in range(feature_count)),
        0.0,
    )
    return sqrt(squared_sum)

# Locate the most similar neighbors

def get_neighbors(train, test_row, num_neighbors):
    """Return the num_neighbors training rows closest to test_row.

    Distances are computed with euclidean_distance(test_row, train_row) and
    the rows are returned nearest first.
    """
    scored = [
        (candidate, euclidean_distance(test_row, candidate))
        for candidate in train
    ]
    # list.sort is stable, so equally distant rows keep their training order.
    scored.sort(key=lambda pair: pair[1])
    return [scored[rank][0] for rank in range(num_neighbors)]

# Make a prediction with neighbors

def predict_classification(train, test_row, num_neighbors):
    """Predict the class of test_row by majority vote of its neighbors.

    Args:
        train: Training rows whose last element is the class label.
        test_row: The row to classify.
        num_neighbors: How many nearest neighbors take part in the vote.

    Returns:
        The most common class label among the nearest neighbors.
    """
    neighbors = get_neighbors(train, test_row, num_neighbors)
    output_values = [row[-1] for row in neighbors]
    # Iterate the list (nearest neighbor first) rather than a set: max()
    # returns the first maximal item, so a tied vote goes to the class of the
    # closest neighbor instead of depending on arbitrary set ordering.
    prediction = max(output_values, key=output_values.count)
    return prediction

# Make a prediction with KNN on Iris Dataset

filename = 'iris.csv'
dataset = load_csv(filename)

# Drop the header row (e.g. "sepal.length,...") if the file has one; left in
# place it would be treated as a training record.
try:
    float(dataset[0][0])
except ValueError:
    dataset = dataset[1:]

# convert feature columns to floats so that distances are computed on the
# real measurements rather than on arbitrary category codes
for i in range(len(dataset[0])-1):
    str_column_to_float(dataset, i)

# convert class column to integers
str_column_to_int(dataset, len(dataset[0])-1)

# define model parameter
num_neighbors = 5

# define a new record
row = [5.7,2.9,4.2,1.3]

# predict the label
# euclidean_distance ignores the last element of its first argument (the
# label slot), so pad the unlabeled record with a placeholder label;
# otherwise its fourth feature would be dropped from the comparison.
label = predict_classification(dataset, row + [None], num_neighbors)

print('Data=%s, Predicted: %s' % (row, label))

output
[5.3] => 0
[4.8] => 1
[7.6] => 2
[7.4] => 3
[6.8] => 4
[5.7] => 5
[6.1] => 6
[7.2] => 7
[4.6] => 8
[5.4] => 9
[4.7] => 10
[7] => 11
[4.3] => 12
[6.4] => 13
[5.6] => 14
[6.6] => 15
[7.9] => 16
[5.1] => 17
[sepal.length] => 18
[7.3] => 19
[6] => 20
[4.5] => 21
[6.9] => 22
[6.2] => 23
[4.4] => 24
[7.7] => 25
[6.7] => 26
[5.2] => 27
[5.9] => 28
[4.9] => 29
[6.3] => 30
[7.1] => 31
[6.5] => 32
[5] => 33
[5.8] => 34
[5.5] => 35
[3.4] => 0
[3.8] => 1
[2.2] => 2
[2.9] => 3
[2.8] => 4
[3.9] => 5
[3] => 6
[2] => 7
[2.3] => 8
[sepal.width] => 9
[3.1] => 10
[4] => 11
[4.1] => 12
[3.6] => 13
[4.4] => 14
[2.7] => 15
[2.6] => 16
[3.5] => 17
[4.2] => 18
[2.5] => 19
[3.2] => 20
[3.3] => 21
[3.7] => 22
[2.4] => 23
[3.8] => 0
[5.3] => 1
[1.9] => 2
[1] => 3
[4.8] => 4
[3.9] => 5
[5.7] => 6
[6.1] => 7
[3] => 8
[4.6] => 9
[1.1] => 10
[5.4] => 11
[4.7] => 12
[4.3] => 13
[5.6] => 14
[6.4] => 15
[6.6] => 16
[1.4] => 17
[1.6] => 18
[5.1] => 19
[1.7] => 20
[4] => 21
[6] => 22
[4.1] => 23
[4.5] => 24
[6.9] => 25
[1.5] => 26
[3.6] => 27
[4.4] => 28
[1.3] => 29
[6.7] => 30
[5.2] => 31
[3.5] => 32
[4.2] => 33
[3.3] => 34
[5.9] => 35
[4.9] => 36
[1.2] => 37
[petal.length] => 38
[3.7] => 39
[6.3] => 40
[5] => 41
[5.8] => 42
[5.5] => 43
[petal.width] => 0
[2.2] => 1
[2.1] => 2
[1.9] => 3
[0.5] => 4
[1] => 5
[0.6] => 6
[0.4] => 7
[1.1] => 8
[1.4] => 9
[1.6] => 10
[2] => 11
[2.3] => 12
[1.7] => 13
[0.1] => 14
[0.2] => 15
[1.5] => 16
[1.3] => 17
[2.5] => 18
[1.8] => 19
[0.3] => 20
[1.2] => 21
[2.4] => 22
[Setosa] => 0
[Versicolor] => 1
[Virginica] => 2
[variety] => 3
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[] => 0
[5.4] => 1
[sepal.length] => 2
[5.8] => 3
[5.2] => 4
[3.5] => 0
[] => 1
[3] => 2
[2.7] => 3
[sepal.width] => 4
[] => 0
[4.5] => 1
[petal.length] => 2
[1.5] => 3
[5.1] => 4
[] => 0
[petal.width] => 1
[1.9] => 2
[0.2] => 3
[1.5] => 4
[] => 0
[?] => 1
[variety] => 2
Data=[5.7, 2.9, 4.2, 1.3], Predicted: 0

ML#07
No ratings yet
ML#07
21 pages
KNN - Jupyter Notebook
No ratings yet
KNN - Jupyter Notebook
8 pages
ML Lab Programs
No ratings yet
ML Lab Programs
23 pages
2 - 9 - KNN Code
No ratings yet
2 - 9 - KNN Code
6 pages
Week 6 K Nearestneighbors 1
No ratings yet
Week 6 K Nearestneighbors 1
11 pages
K-NN Algorithm: Need To Create Two Files File 1: KNN - Py Second File: Expt3.py
No ratings yet
K-NN Algorithm: Need To Create Two Files File 1: KNN - Py Second File: Expt3.py
4 pages
Practical 5
No ratings yet
Practical 5
11 pages
7 Output
No ratings yet
7 Output
4 pages
DS Report
No ratings yet
DS Report
11 pages
Machine Learning All Lab Experiments VTU 6th Sem
No ratings yet
Machine Learning All Lab Experiments VTU 6th Sem
27 pages
ML Labmanual
No ratings yet
ML Labmanual
33 pages
TranMinhTu1 bt2 2
No ratings yet
TranMinhTu1 bt2 2
5 pages
KNN and K-Means with Iris Dataset
No ratings yet
KNN and K-Means with Iris Dataset
6 pages
Implementing KNN Algorithm On The Iris Dataset
No ratings yet
Implementing KNN Algorithm On The Iris Dataset
7 pages
Iris Dataset Analysis with KNN & K-Means
No ratings yet
Iris Dataset Analysis with KNN & K-Means
6 pages
KNN Model Find Optimanl K
No ratings yet
KNN Model Find Optimanl K
3 pages
SC Assignment Q2
No ratings yet
SC Assignment Q2
7 pages
Python ML Algorithms Guide
No ratings yet
Python ML Algorithms Guide
7 pages
Lab7.ipynb - Colaboratory
100% (1)
Lab7.ipynb - Colaboratory
5 pages
DSM 2
No ratings yet
DSM 2
7 pages
KNN ALGORITHM - Ipynb - Colab
No ratings yet
KNN ALGORITHM - Ipynb - Colab
4 pages
ML Lab 1-5
No ratings yet
ML Lab 1-5
5 pages
Lab Manual ML
No ratings yet
Lab Manual ML
23 pages
Lab4 KNN
No ratings yet
Lab4 KNN
9 pages
ML Short Code - Under Updating
No ratings yet
ML Short Code - Under Updating
4 pages
Assignment #1: K Nearest Neighbor Classifier: Name: Srikanth Mujjiga (Roll No: 2015-50-831
No ratings yet
Assignment #1: K Nearest Neighbor Classifier: Name: Srikanth Mujjiga (Roll No: 2015-50-831
8 pages
KNN Classification on Iris Dataset
No ratings yet
KNN Classification on Iris Dataset
3 pages
KNN - Predictive Analysis
No ratings yet
KNN - Predictive Analysis
6 pages
Lab06 KNN 01
No ratings yet
Lab06 KNN 01
3 pages
L6 Tutorial - KNN - Jupyter Notebook
No ratings yet
L6 Tutorial - KNN - Jupyter Notebook
7 pages
Aiml Lab
No ratings yet
Aiml Lab
14 pages
Logistic Regression on Iris Dataset
No ratings yet
Logistic Regression on Iris Dataset
7 pages
Lab Extern L
No ratings yet
Lab Extern L
8 pages
DSBDA6
No ratings yet
DSBDA6
6 pages
It - S All About Neighbors - Completed
No ratings yet
It - S All About Neighbors - Completed
14 pages
Week 6 (PCA, SVD, LDA)
No ratings yet
Week 6 (PCA, SVD, LDA)
14 pages
03 - K Means Clustering On Iris Datasets
No ratings yet
03 - K Means Clustering On Iris Datasets
4 pages
L3 - Classification - RandomForest - Jupyter Notebook
No ratings yet
L3 - Classification - RandomForest - Jupyter Notebook
6 pages
Assignment 5'
No ratings yet
Assignment 5'
4 pages
TASK01 IrisFlowerClassificationwithMachineLearning 1752340862
No ratings yet
TASK01 IrisFlowerClassificationwithMachineLearning 1752340862
3 pages
Aids - ML - B3 - 74 - Assi 1
No ratings yet
Aids - ML - B3 - 74 - Assi 1
6 pages
Program 4
No ratings yet
Program 4
3 pages
Assignment No 2 AI
No ratings yet
Assignment No 2 AI
4 pages
DMT Cia2
No ratings yet
DMT Cia2
11 pages
Titanic Shuffle Analysis in ML Lab
No ratings yet
Titanic Shuffle Analysis in ML Lab
24 pages
MLLab Manual
No ratings yet
MLLab Manual
24 pages
ML Practice
No ratings yet
ML Practice
10 pages
Lecture 12 K-Nearest Neighbors
No ratings yet
Lecture 12 K-Nearest Neighbors
24 pages
Rahul Raj - Ipynb - Colab
No ratings yet
Rahul Raj - Ipynb - Colab
50 pages
DSE 6 - Colab
No ratings yet
DSE 6 - Colab
5 pages
Machine Learning Lab Manual
No ratings yet
Machine Learning Lab Manual
9 pages
KNN Datacamp
No ratings yet
KNN Datacamp
31 pages
Mlalllabprgs
No ratings yet
Mlalllabprgs
17 pages
Machine Learning Lab Manual
No ratings yet
Machine Learning Lab Manual
26 pages
Lab4 23cs142
No ratings yet
Lab4 23cs142
2 pages
KNN Distance Calculation Explained
No ratings yet
KNN Distance Calculation Explained
14 pages
V
No ratings yet
V
8 pages
ML Four To Eight
No ratings yet
ML Four To Eight
3 pages
Canara WP BusinessCaseForMonitoring
No ratings yet
Canara WP BusinessCaseForMonitoring
12 pages
Ethics in Information Systems
No ratings yet
Ethics in Information Systems
41 pages
Internet Connectivity Financial Offer To MD (Goni Group)
No ratings yet
Internet Connectivity Financial Offer To MD (Goni Group)
7 pages
Casey Wang Reesume
No ratings yet
Casey Wang Reesume
2 pages
JRC Jue-75c
No ratings yet
JRC Jue-75c
175 pages
Lec 5 Image Processing
No ratings yet
Lec 5 Image Processing
103 pages
FL4000H Flame Detector Overview
No ratings yet
FL4000H Flame Detector Overview
4 pages
Ai in Road Safety
No ratings yet
Ai in Road Safety
4 pages
Tourism System Project Report
No ratings yet
Tourism System Project Report
46 pages
Internet Manual
No ratings yet
Internet Manual
11 pages
Text Preprocessing Techniques for NLP
No ratings yet
Text Preprocessing Techniques for NLP
3 pages
Aash Education Pvt. Ltd. Aash Education Pvt. LTD.: Computer
No ratings yet
Aash Education Pvt. Ltd. Aash Education Pvt. LTD.: Computer
22 pages
Basic Design Using Rtos
No ratings yet
Basic Design Using Rtos
12 pages
Software Engg Lab Manual
No ratings yet
Software Engg Lab Manual
35 pages
Quantum Computing for MIS Students
No ratings yet
Quantum Computing for MIS Students
10 pages
Evidence Property Insurance PDF
No ratings yet
Evidence Property Insurance PDF
2 pages
Understanding Logistic Regression Basics
No ratings yet
Understanding Logistic Regression Basics
8 pages
Digital System Design Course Overview
No ratings yet
Digital System Design Course Overview
2 pages
(2020129) On Layer Normalization in The Transformer Architecture
No ratings yet
(2020129) On Layer Normalization in The Transformer Architecture
17 pages
AZ 700T00A ENU PowerPoint - 04
No ratings yet
AZ 700T00A ENU PowerPoint - 04
42 pages
Create a Gmail Connector for Vantage
No ratings yet
Create a Gmail Connector for Vantage
18 pages
TCL Scripting
No ratings yet
TCL Scripting
81 pages
A Study On 3D Printer Design With Con Veyor in Industrial Applications
No ratings yet
A Study On 3D Printer Design With Con Veyor in Industrial Applications
19 pages
Coal - Lab Sol, 4
No ratings yet
Coal - Lab Sol, 4
7 pages
3d Printing Term Paper
50% (2)
3d Printing Term Paper
4 pages
Brain Tumor Detection and Classification Using Intelligence Techniques An Overview
No ratings yet
Brain Tumor Detection and Classification Using Intelligence Techniques An Overview
17 pages
Kishore Icet
No ratings yet
Kishore Icet
2 pages
Device Communication Protocol Guide
No ratings yet
Device Communication Protocol Guide
82 pages
Revised Syllabus Data Science 10 Weeks
No ratings yet
Revised Syllabus Data Science 10 Weeks
2 pages
User Manual BM115 3.0 - 6 12KW Auto Focusing Laser Cutting Head - V3.0 PDF
No ratings yet
User Manual BM115 3.0 - 6 12KW Auto Focusing Laser Cutting Head - V3.0 PDF
26 pages

Python KNN

Uploaded by

Python KNN

Uploaded by

KNN: Python Code

-Priya R. Bachan, Rishika

from csv import reader

from math import sqrt

# Load a CSV file

with open(filename, 'r') as file:

for row in csv_reader:

# Convert string column to float

def str_column_to_float(dataset, column):

for row in dataset:

# Convert string column to integer

def str_column_to_int(dataset, column):

class_values = [row[column] for row in dataset]

for i, value in enumerate(unique):

print('[%s] => %d' % (value, i))

# Find the min and max values for each column

col_values = [row[i] for row in dataset]

# Rescale dataset columns to the range 0-1

def normalize_dataset(dataset, minmax):

for row in dataset:

row[i] = (row[i] - minmax[i][0]) / (minmax[i][1] - minmax[i][0])

# Calculate the Euclidean distance between two vectors

def euclidean_distance(row1, row2):

distance += (row1[i] - row2[i])**2

# Locate the most similar neighbors

def get_neighbors(train, test_row, num_neighbors):

for train_row in train:

distances.sort(key=lambda tup: tup[1])

# Make a prediction with neighbors

def predict_classification(train, test_row, num_neighbors):

neighbors = get_neighbors(train, test_row, num_neighbors)

output_values = [row[-1] for row in neighbors]

prediction = max(set(output_values), key=output_values.count)

# Make a prediction with KNN on Iris Dataset

# convert class column to integers

# define model parameter

# define a new record

# predict the label

label = predict_classification(dataset, row, num_neighbors)

print('Data=%s, Predicted: %s' % (row, label))

You might also like