0% found this document useful (0 votes)

29 views8 pages

Prakhar - Week 5

The document contains a lab assignment for data mining and web algorithms, featuring implementations of K-Nearest Neighbors (KNN), Naive Bayes, and Decision Tree algorithms in Python. It includes code for calculating distances, fitting models, making predictions, and evaluating accuracy using the Iris dataset. The assignment concludes with a test of the Decision Tree model on sample data with predictions and accuracy output.

Uploaded by

xonab72362

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

29 views8 pages

Prakhar - Week 5

Uploaded by

xonab72362

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 8

DATA MINING & WEB ALGORITHMS LAB

Assignment: Week 5

Ans 1.
import math

import pandas as pd
def distance(u1, u2):
    """Return the Euclidean distance between two equal-length numeric vectors.

    Components are paired by position through iteration, so any sized
    iterable of numbers works (list, tuple, NumPy array, pandas Series)
    regardless of how it is labelled or indexed.

    Args:
        u1: First vector.
        u2: Second vector.

    Returns:
        The Euclidean (L2) distance as a float.

    Raises:
        ValueError: If the two vectors do not have the same length.
    """
    if len(u1) != len(u2):
        raise ValueError("distance() requires vectors of equal length")
    # zip() walks the values positionally, avoiding integer indexing, which on
    # a label-indexed pandas Series is a label lookup rather than a position.
    squared_sum = sum((a - b) ** 2 for a, b in zip(u1, u2))
    return math.sqrt(squared_sum)

def fun(data):
    """Build the pairwise Euclidean distance matrix for the rows of *data*.

    Args:
        data: A pandas DataFrame; each row is treated as one numeric vector
            (assumes every column is numeric - TODO confirm for '1.csv').

    Returns:
        A square list of lists ``m`` with ``len(data)`` rows and columns where
        ``m[i][j]`` is the distance between the i-th and j-th rows (by
        position). The diagonal is ``0.0``.
    """
    # Work on positional rows so the result does not depend on index labels.
    rows = data.to_numpy()
    size = len(rows)
    m = [[0.0] * size for _ in range(size)]
    # Start at row 0 (the first record) and fill both halves at once: the
    # distance is symmetric, so each pair only needs to be computed one time.
    for i in range(size):
        for j in range(i + 1, size):
            m[i][j] = m[j][i] = distance(rows[i], rows[j])
    return m

# Read the data set from disk, compute its pairwise distance matrix and show it.
data = pd.read_csv('1.csv')
m = fun(data)
print(m)

Output:
-
Ans 2.
import pandas as pd
import numpy as np
import math
import scipy.spatial.distance
from collections import Counter
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split

class KNN:
    """k-nearest-neighbours classifier using Euclidean distance and majority vote."""

    def __init__(self, k):
        """Store the number of neighbours consulted for each prediction.

        Args:
            k: Number of nearest training samples that vote on a label.

        Raises:
            ValueError: If *k* is smaller than 1.
        """
        if k < 1:
            raise ValueError("k must be at least 1")
        self.k = k

    def fit(self, X_train, y_train):
        """Memorise the training samples and their labels.

        Inputs are converted to NumPy arrays so that lists and pandas objects
        are indexed by position during prediction.
        """
        self.X_train = np.asarray(X_train)
        self.y_train = np.asarray(y_train)

    def predict(self, X_test):
        """Return the predicted label for every sample in *X_test*.

        Each sample receives the most frequent label among its ``k`` nearest
        training samples. When several labels are equally frequent, the one
        belonging to the closest neighbour wins, so results are deterministic.

        Returns:
            A NumPy array with one label per test sample.
        """
        y_pred = []
        for x in np.asarray(X_test):
            diffs = self.X_train - x
            # Flatten each per-sample difference so the norm is taken over all
            # of its components, whatever the shape of a single sample.
            distances = np.linalg.norm(diffs.reshape(len(diffs), -1), axis=1)
            # A stable sort keeps equally distant samples in training order.
            nearest = np.argsort(distances, kind="stable")[:self.k]
            votes = Counter(self.y_train[nearest].tolist())
            # most_common() lists equal counts in first-seen order, i.e. by
            # increasing distance here.
            y_pred.append(votes.most_common(1)[0][0])
        return np.array(y_pred)

    def score(self, X_test, y_test):
        """Return the fraction of samples in *X_test* whose prediction equals *y_test*."""
        predictions = self.predict(X_test)
        return (predictions == np.asarray(y_test)).sum() / len(y_test)

class NaiveBayes:
    """Gaussian naive Bayes classifier with per-class feature means and variances."""

    def fit(self, X, y):
        """Estimate class priors and per-feature Gaussian parameters.

        Args:
            X: Training samples, one row per sample (any array-like).
            y: Class label of each training sample.

        Sets ``classes``, ``priors``, ``means`` and ``variances``; the last
        three are dictionaries keyed by class label.
        """
        X = np.asarray(X)
        y = np.asarray(y)
        self.classes = np.unique(y)
        self.priors = {c: np.mean(y == c) for c in self.classes}
        self.means = {c: np.mean(X[y == c], axis=0) for c in self.classes}
        # The small constant keeps the variance strictly positive so the
        # density stays finite for features that are constant within a class.
        self.variances = {
            c: np.var(X[y == c], axis=0) + 1e-6 for c in self.classes
        }

    def _log_posterior(self, x, c):
        """Return log(prior) + log(Gaussian likelihood) of sample *x* for class *c*."""
        variance = self.variances[c]
        log_likelihood = -0.5 * np.sum(
            np.log(2 * np.pi * variance) + (x - self.means[c]) ** 2 / variance
        )
        return np.log(self.priors[c]) + log_likelihood

    def predict(self, X_test):
        """Return the most probable class for every sample in *X_test*.

        Scores are accumulated in log-space: multiplying many per-feature
        densities directly underflows to 0.0 for high-dimensional samples,
        which would make every class tie. Taking logarithms preserves the
        ranking of the classes, so predictions are otherwise unchanged.

        Returns:
            A NumPy array with one class label per test sample.
        """
        y_pred = []
        for x in X_test:
            scores = {c: self._log_posterior(x, c) for c in self.classes}
            y_pred.append(max(scores, key=scores.get))
        return np.array(y_pred)

    def score(self, X_test, y_test):
        """Return the fraction of samples in *X_test* whose prediction equals *y_test*."""
        predictions = self.predict(X_test)
        return (predictions == np.asarray(y_test)).sum() / len(y_test)

# Load the Iris data once and hold out 20% of the samples for testing.
iris = load_iris()
X_train, X_test, y_train, y_test = train_test_split(
    iris.data, iris.target, random_state=42, test_size=0.2
)

# KNN
knn = KNN(3)
knn.fit(X_train, y_train)
knn_r = knn.predict(X_test)
accuracyknn = knn.score(X_test, y_test)
print(f"KNN Accuracy: {accuracyknn:.4f}")

# Naive Bayes
nb = NaiveBayes()
nb.fit(X_train, y_train)
nb_r = nb.predict(X_test)
accuracynb = nb.score(X_test, y_test)
print(f"Naive Bayes Accuracy: {accuracynb:.4f}")

Output:
-
# Ans 3.
class DecisionTreeID3:
    """ID3-style decision tree for categorical features with a depth limit.

    The fitted tree is stored in ``self.tree`` as nested dictionaries of the
    form ``{feature_index: {feature_value: subtree_or_label}}``; any node that
    is not a dictionary is a leaf holding the predicted label.
    """

    def __init__(self, depth=3):
        """Store the depth at which tree growth stops."""
        self.depth = depth

    def _entropy(self, y):
        """Return the Shannon entropy (in bits) of the labels in *y*."""
        _, counts = np.unique(y, return_counts=True)
        prob = counts / len(y)
        # Every count is at least 1, so prob > 0 and log2 needs no epsilon;
        # adding one would make the entropy of a pure node slightly negative.
        return -np.sum(prob * np.log2(prob))

    def _majority_label(self, y):
        """Return the most frequent label in *y* (smallest label on ties)."""
        values, counts = np.unique(y, return_counts=True)
        return values[np.argmax(counts)]

    def _info_gain(self, X, y, feature_idx):
        """Return the entropy reduction obtained by splitting on one feature."""
        column = X[:, feature_idx]
        values, counts = np.unique(column, return_counts=True)
        weighted_entropy = sum(
            (count / len(X)) * self._entropy(y[column == value])
            for value, count in zip(values, counts)
        )
        return self._entropy(y) - weighted_entropy

    def _best_split(self, X, y):
        """Return the index of the feature with the highest information gain."""
        gains = [self._info_gain(X, y, i) for i in range(X.shape[1])]
        return int(np.argmax(gains))

    def _build_tree(self, X, y, depth=0):
        """Recursively grow the tree and return its root node.

        Growth stops when all labels agree or the depth limit is reached; the
        leaf then predicts the majority label of the samples that reached it.
        """
        if len(np.unique(y)) == 1 or depth == self.depth:
            return self._majority_label(y)
        feature_idx = self._best_split(X, y)
        column = X[:, feature_idx]
        branches = {}
        for value in np.unique(column):
            mask = column == value
            branches[value] = self._build_tree(X[mask], y[mask], depth + 1)
        return {feature_idx: branches}

    def fit(self, X, y):
        """Build the tree from training samples *X* and labels *y*.

        Raises:
            ValueError: If no training samples are supplied.
        """
        X = np.asarray(X)
        y = np.asarray(y)
        if len(y) == 0:
            raise ValueError("cannot fit a decision tree on an empty training set")
        self.tree = self._build_tree(X, y)

    def predict(self, X):
        """Return a NumPy array with the predicted label of every row of *X*."""
        return np.array([self._predict_one(x, self.tree) for x in X])

    def _predict_one(self, x, tree):
        """Walk *tree* for one sample and return the label of the leaf reached.

        A feature value that was not seen at that node during training yields
        the sentinel ``-1``.
        """
        node = tree
        while isinstance(node, dict):
            feature_idx = next(iter(node))
            node = node[feature_idx].get(x[feature_idx], -1)
        return node

    def score(self, X_test, y_test):
        """Return the fraction of rows in *X_test* whose prediction equals *y_test*."""
        predictions = self.predict(X_test)
        return (predictions == np.asarray(y_test)).mean()

# NOTE(review): X and y (training features and labels) are not defined anywhere
# in the visible source - they must be created before this point; confirm
# against the complete assignment.
tree = DecisionTreeID3(depth=3)
tree.fit(X, y)

# Hand-written samples; 'Committed?' is the label column, the rest are features.
test_samples = [
    {'Branch': 'CSE', 'CGPA': 'Low', 'Gamer': 'Yes', 'Movie Fanatic': 'No',
     'Committed?': 'Yes'},
    {'Branch': 'ECE', 'CGPA': 'High', 'Gamer': 'Yes', 'Movie Fanatic': 'No',
     'Committed?': 'No'},
    {'Branch': 'MECH', 'CGPA': 'Low', 'Gamer': 'No', 'Movie Fanatic': 'Yes',
     'Committed?': 'No'},
]
test_df = pd.DataFrame(test_samples)
X_test = test_df.drop(columns='Committed?').values
y_test = test_df['Committed?'].values

# Report predictions, ground truth and accuracy exactly once each.
predictions = tree.predict(X_test)
print(f"Predictions: {predictions}")
print(f"True Labels: {y_test}")
accuracy = tree.score(X_test, y_test)
print(f"Test Accuracy: {accuracy:.2f}")

Output:
-

----------------------FINISHED-----------------------

Submitted By-:
Name: PRAKHAR MADNANI
Enrol. No.-: 22104057

"Cryptography Essentials" Course Project: Instructions
No ratings yet
"Cryptography Essentials" Course Project: Instructions
4 pages
Simulated Annealing For VLSI Cell Placement
No ratings yet
Simulated Annealing For VLSI Cell Placement
14 pages
Qftnotes 3
No ratings yet
Qftnotes 3
15 pages
Ai Int-1
No ratings yet
Ai Int-1
6 pages
LAB-4 Report
No ratings yet
LAB-4 Report
21 pages
16BCB0126 VL2018195002535 Pe003
No ratings yet
16BCB0126 VL2018195002535 Pe003
40 pages
All in One
No ratings yet
All in One
13 pages
Unit2 ML Programs
No ratings yet
Unit2 ML Programs
7 pages
ML File
No ratings yet
ML File
13 pages
ML5 Implementation
No ratings yet
ML5 Implementation
32 pages
Aiml Ex 4-7
No ratings yet
Aiml Ex 4-7
8 pages
ML Lab
No ratings yet
ML Lab
7 pages
ML Journal External
No ratings yet
ML Journal External
14 pages
ML Lab Experiment Shortened With Same Output
No ratings yet
ML Lab Experiment Shortened With Same Output
6 pages
Aiml Lab
No ratings yet
Aiml Lab
14 pages
Programs Lab Bca
No ratings yet
Programs Lab Bca
16 pages
Final ML Programs 075005
No ratings yet
Final ML Programs 075005
15 pages
ML Lab Manual
No ratings yet
ML Lab Manual
12 pages
ML
No ratings yet
ML
11 pages
ML Lab PT
No ratings yet
ML Lab PT
25 pages
1st PGM
No ratings yet
1st PGM
10 pages
DM ML Practical
No ratings yet
DM ML Practical
13 pages
Import Numpy As NP
No ratings yet
Import Numpy As NP
4 pages
Assignment #1: K Nearest Neighbor Classifier: Name: Srikanth Mujjiga (Roll No: 2015-50-831
No ratings yet
Assignment #1: K Nearest Neighbor Classifier: Name: Srikanth Mujjiga (Roll No: 2015-50-831
8 pages
Aiml Practical
No ratings yet
Aiml Practical
17 pages
Slip
No ratings yet
Slip
5 pages
Experiment01 Baseline Models Accuracy
No ratings yet
Experiment01 Baseline Models Accuracy
35 pages
Practicalpgm ML
No ratings yet
Practicalpgm ML
33 pages
PCA Codebase
No ratings yet
PCA Codebase
6 pages
Decision Tree
No ratings yet
Decision Tree
6 pages
Machine Learning Cheatsheet
No ratings yet
Machine Learning Cheatsheet
5 pages
1
No ratings yet
1
13 pages
AIML Prograns
No ratings yet
AIML Prograns
6 pages
Data Mining Assignment No. 1
No ratings yet
Data Mining Assignment No. 1
7 pages
Shobit Sharma (2124399) ML Lab File PDF
No ratings yet
Shobit Sharma (2124399) ML Lab File PDF
19 pages
AI Assignment-6
No ratings yet
AI Assignment-6
7 pages
Atul MLT Exp 4-11
No ratings yet
Atul MLT Exp 4-11
17 pages
1 10
No ratings yet
1 10
4 pages
Linearregression SVM
No ratings yet
Linearregression SVM
3 pages
22MCA1008 - Varun ML LAB ASSIGNMENTS
100% (1)
22MCA1008 - Varun ML LAB ASSIGNMENTS
41 pages
ML External Xerox
No ratings yet
ML External Xerox
1 page
ML II Lab
No ratings yet
ML II Lab
5 pages
Udacity Machine Learning Analysis Supervised Learning
100% (1)
Udacity Machine Learning Analysis Supervised Learning
504 pages
Assignment 5
No ratings yet
Assignment 5
5 pages
ML All Projectpdf Removed
No ratings yet
ML All Projectpdf Removed
41 pages
AI ML - Cycle 2 Programs
No ratings yet
AI ML - Cycle 2 Programs
15 pages
Program 4
No ratings yet
Program 4
3 pages
ML Lab Programs
No ratings yet
ML Lab Programs
8 pages
ML Algorithms
100% (1)
ML Algorithms
1 page
ML - LAB - 7 - Jupyter Notebook
100% (1)
ML - LAB - 7 - Jupyter Notebook
7 pages
Aam Codes
No ratings yet
Aam Codes
8 pages
ML Cheatsheet
No ratings yet
ML Cheatsheet
4 pages
Python For Data Science IA 1 Programs
No ratings yet
Python For Data Science IA 1 Programs
14 pages
Naive Bayes
No ratings yet
Naive Bayes
58 pages
ML Lab P-1
No ratings yet
ML Lab P-1
10 pages
Internal
No ratings yet
Internal
3 pages
Scikit-Learn Cheat Sheet
No ratings yet
Scikit-Learn Cheat Sheet
1 page
Scikit-Learn Cheat Sheet
No ratings yet
Scikit-Learn Cheat Sheet
1 page
Data Mining Practicals
No ratings yet
Data Mining Practicals
22 pages
Ai Last 5
No ratings yet
Ai Last 5
4 pages
Shubham Pract 6 - Merged
No ratings yet
Shubham Pract 6 - Merged
12 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
Inverse Trigonometric Functions (Trigonometry) Mathematics Question Bank
From Everand
Inverse Trigonometric Functions (Trigonometry) Mathematics Question Bank
Mohmmad Khaja Shareef
No ratings yet
41 Essential Machine Learning Interview Questions: 18 Mins Read
No ratings yet
41 Essential Machine Learning Interview Questions: 18 Mins Read
21 pages
Module 5.6 - 5.7 Pearson R and Regression
No ratings yet
Module 5.6 - 5.7 Pearson R and Regression
25 pages
Cienciadedatos
No ratings yet
Cienciadedatos
21 pages
Annex C Robust Analysis: (Normative)
0% (1)
Annex C Robust Analysis: (Normative)
1 page
Assignment 2 Solution
No ratings yet
Assignment 2 Solution
4 pages
Robotics Assignment 1
No ratings yet
Robotics Assignment 1
9 pages
Two Port networks-NEO
No ratings yet
Two Port networks-NEO
30 pages
Computational Physics With Worked Out Examples in Fortran and Matlab Michael Bestehorn PDF Download
No ratings yet
Computational Physics With Worked Out Examples in Fortran and Matlab Michael Bestehorn PDF Download
64 pages
Gematmw Reviewer
No ratings yet
Gematmw Reviewer
14 pages
6 - Algorithmic Foundations
No ratings yet
6 - Algorithmic Foundations
33 pages
NASA-CR-33 Probability Functions For Random Responses - Prediction of Peaks, Fatigue Damage, and Catastrophic Failures
No ratings yet
NASA-CR-33 Probability Functions For Random Responses - Prediction of Peaks, Fatigue Damage, and Catastrophic Failures
60 pages
Compound Interest
No ratings yet
Compound Interest
12 pages
Intro To Crypto Graphy
No ratings yet
Intro To Crypto Graphy
13 pages
Classification of Facility Layout Problems: A Review Study: Original Article
No ratings yet
Classification of Facility Layout Problems: A Review Study: Original Article
21 pages
Qbasic Output
No ratings yet
Qbasic Output
12 pages
Character Recognition Using ANN
No ratings yet
Character Recognition Using ANN
52 pages
Unit 3 - Dsa
No ratings yet
Unit 3 - Dsa
76 pages
Lab 05
No ratings yet
Lab 05
5 pages
14 Forecasting2 NOTES
No ratings yet
14 Forecasting2 NOTES
19 pages
Tut RL-1
No ratings yet
Tut RL-1
2 pages
Practice Problems
No ratings yet
Practice Problems
2 pages
Syllabus
No ratings yet
Syllabus
2 pages
SPSS Assignment 3. Group 1. Schofield, Stuerman, Sulin and Williams
No ratings yet
SPSS Assignment 3. Group 1. Schofield, Stuerman, Sulin and Williams
10 pages
Advance-Math Portfolio Carbon
No ratings yet
Advance-Math Portfolio Carbon
98 pages
BookSlides 5A Similarity Based Learning
No ratings yet
BookSlides 5A Similarity Based Learning
40 pages
Signals and Systems
No ratings yet
Signals and Systems
42 pages
Asymptotic Analysis
No ratings yet
Asymptotic Analysis
28 pages

Prakhar - Week 5

Uploaded by

Prakhar - Week 5

Uploaded by

DATA MINING & WEB ALGORITHMS LAB

Ans 1. import math

def predict(self, X_test):

def _entropy(self, y):

def _info_gain(self, X, y, feature_idx):

def _best_split(self, X, y):

def _build_tree(self, X, y, depth=0):

def fit(self, X, y):

def predict(self, X):

def _predict_one(self, x, tree):

def score(self, X_test, y_test):

You might also like