
Program 4

Demonstrate the working of the decision-tree-based ID3 algorithm. Use an appropriate data set for
building the decision tree and apply this knowledge to classify a new sample.
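
The program implements ID3 in Python, with functions for calculating entropy, information gain, generating child nodes, and recursively constructing the decision tree from a CSV dataset whose last column is the class label. The file name passed to read_csv below is a placeholder. Judging from the output at the end, the training data is the classic play-tennis weather set; an illustrative sketch of the expected CSV format (not the exact file) is:

outlook,temp,humidity,windy,play
sunny,hot,high,Weak,no
overcast,hot,high,Weak,yes
rainy,mild,high,Weak,yes
rainy,cool,normal,Strong,no
... (the full set has 14 rows: 9 yes, 5 no)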

import pandas as pd
import math


# -----------------------------------------------------------------------
# function to calculate the entropy of the entire dataset
# -----------------------------------------------------------------------
def base_entropy(dataset):
    p = 0
    n = 0
    target = dataset.iloc[:, -1]
    targets = list(set(target))
    # count how many rows carry each of the two class labels
    for i in target:
        if i == targets[0]:
            p = p + 1
        else:
            n = n + 1
    if p == 0 or n == 0:    # pure dataset: entropy is 0
        return 0
    elif p == n:            # even class split: entropy is 1
        return 1
    else:
        entropy = -((p / (p + n)) * math.log2(p / (p + n))
                    + (n / (p + n)) * math.log2(n / (p + n)))
        return entropy
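
A quick hand check of the formula (illustrative, not part of the program): with 9 'yes' and 5 'no' labels, as in the classic play-tennis data, the entropy is -(9/14)*log2(9/14) - (5/14)*log2(5/14) ≈ 0.940. A toy call reproduces it:

# hand check (assumes the functions above are already defined)
toy = pd.DataFrame({"outlook": ["sunny"] * 14,
                    "play": ["yes"] * 9 + ["no"] * 5})
print(round(base_entropy(toy), 3))   # prints 0.94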

# -----------------------------------------------------------------------
# function to calculate the entropy of one attribute value of a feature
# -----------------------------------------------------------------------
def entropy(dataset, feature, attribute):
    p = 0
    n = 0
    target = dataset.iloc[:, -1]
    targets = list(set(target))
    # count class labels only over the rows where the feature equals attribute
    for i, j in zip(feature, target):
        if i == attribute and j == targets[0]:
            p = p + 1
        elif i == attribute and j == targets[1]:
            n = n + 1
    if p == 0 or n == 0:
        return 0
    elif p == n:
        return 1
    else:
        entropy = -((p / (p + n)) * math.log2(p / (p + n))
                    + (n / (p + n)) * math.log2(n / (p + n)))
        return entropy

# -----------------------------------------------------------------------
# a utility function for checking the purity or impurity of a child
# -----------------------------------------------------------------------
def counter(target, attribute, i):
    p = 0
    n = 0
    targets = list(set(target))
    # count how many rows with attribute value i fall into each class
    for j, k in zip(target, attribute):
        if j == targets[0] and k == i:
            p = p + 1
        elif j == targets[1] and k == i:
            n = n + 1
    return p, n

# -----------------------------------------------------------------------
# function that calculates the information gain
# -----------------------------------------------------------------------
def Information_Gain(dataset, feature):
    distinct = list(set(feature))
    Info_Gain = 0
    # weighted average entropy over the feature's distinct values ...
    for i in distinct:
        Info_Gain = Info_Gain + feature.count(i) / len(feature) * entropy(dataset, feature, i)
    # ... subtracted from the dataset entropy gives the gain of the split
    Info_Gain = base_entropy(dataset) - Info_Gain
    return Info_Gain
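
Worked example with the textbook play-tennis numbers (for orientation only): splitting on outlook gives Gain = 0.940 - (5/14 * 0.971 + 4/14 * 0 + 5/14 * 0.971) ≈ 0.247, since the overcast branch is pure while the sunny and rainy branches each carry entropy 0.971.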

# -----------------------------------------------------------------------
# function that generates the childs of the selected attribute
# -----------------------------------------------------------------------
def generate_childs(dataset, attribute_index):
    distinct = set(dataset.iloc[:, attribute_index])
    childs = dict()
    # map every distinct value of the attribute to its (p, n) class counts
    for i in distinct:
        childs[i] = counter(dataset.iloc[:, -1], dataset.iloc[:, attribute_index], i)
    return childs
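
At the root of the play-tennis data this produces {'sunny': (3, 2), 'overcast': (0, 4), 'rainy': (2, 3)}, exactly the first line of the output below: overcast is pure, while sunny and rainy mix both classes and must be split further.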

# -----------------------------------------------------------------------
# function that modifies the dataset according to the impure childs
# -----------------------------------------------------------------------
def modify_data_set(dataset, index, feature, impurity):
    # keep only the rows where the chosen feature equals this impure value,
    # then drop that feature column before recursing (the explicit copy
    # avoids the chained-assignment warning that del-on-a-slice triggers)
    subdata = dataset[dataset[feature] == impurity].copy()
    subdata = subdata.drop(columns=feature)
    return subdata
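
For example (illustrative call, assuming outlook is column 0), modify_data_set(df, 0, 'outlook', 'sunny') keeps only the five sunny rows and drops the outlook column, so the recursion splits those rows on the remaining attributes.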

# -----------------------------------------------------------------------
# function that returns the attribute with the greatest information gain
# -----------------------------------------------------------------------
def greatest_information_gain(dataset):
    max_gain = -1                    # renamed from max to avoid shadowing the builtin
    attribute_index = 0
    size = len(dataset.columns) - 1  # exclude the target column
    for i in range(0, size):
        feature = list(dataset.iloc[:, i])
        i_g = Information_Gain(dataset, feature)
        if max_gain < i_g:
            max_gain = i_g
            attribute_index = i
    return attribute_index
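
On the full play-tennis data the winner is outlook: the textbook gains are roughly 0.247 for outlook, 0.029 for temp, 0.151 for humidity and 0.048 for windy, which is why outlook appears as the first key in the output below.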

# -----------------------------------------------------------------------
# function to construct the decision tree
# -----------------------------------------------------------------------
def construct_tree(dataset, tree):
    impure_childs = []
    # expand the attribute with the greatest information gain
    attribute_index = greatest_information_gain(dataset)
    childs = generate_childs(dataset, attribute_index)
    tree[dataset.columns[attribute_index]] = childs
    targets = list(set(dataset.iloc[:, -1]))
    for k, v in childs.items():
        if v[0] == 0:      # pure child: only the second class remains
            tree[k] = targets[1]
        elif v[1] == 0:    # pure child: only the first class remains
            tree[k] = targets[0]
        else:              # impure child: split it further
            impure_childs.append(k)
    for i in impure_childs:
        sub = modify_data_set(dataset, attribute_index,
                              dataset.columns[attribute_index], i)
        tree = construct_tree(sub, tree)
    return tree

# -----------------------------------------------------------------------
# main function
# -----------------------------------------------------------------------
def main():
    # the CSV file is expected to hold the class label in its last column
    df = pd.read_csv("filename.csv")
    tree = dict()
    result = construct_tree(df, tree)
    for key, value in result.items():
        print(key, " => ", value)


# -----------------------------------------------------------------------
if __name__ == "__main__":
    main()
OUTPUT

outlook => {'sunny': (3, 2), 'overcast': (0, 4), 'rainy': (2, 3)}
overcast => yes
temp => {'mild': (1, 2), 'cool': (1, 1)}
hot => no
cool => yes
humidity => {'normal': (1, 1)}
high => no
normal => yes
windy => {'Weak': (0, 1), 'Strong': (1, 0)}
Weak => yes
Strong => no
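
The exercise also asks to classify a new sample, which the program above does not do. Below is a minimal sketch of a classifier over the flat dictionary that construct_tree returns; classify and sample are names introduced here, not part of the original program. Because the flat dictionary loses the tree's nesting, the walk is only a heuristic: it returns the label of the first attribute value, in insertion order, that the tree resolved to a pure leaf.

def classify(tree, sample):
    # walk the flat tree in insertion order; whenever an entry is an
    # attribute (its value is a dict of child counts), look up the sample's
    # value for that attribute: if the tree mapped that value to a class
    # label, return it, otherwise the value was impure and a later
    # attribute entry refines it
    for key, value in tree.items():
        if isinstance(value, dict) and key in sample:
            branch = sample[key]
            if branch in tree and not isinstance(tree[branch], dict):
                return tree[branch]
    return None

# example call (would run at the end of main, where result is in scope):
# sample = {"outlook": "overcast", "temp": "hot", "humidity": "high", "windy": "Weak"}
# print(classify(result, sample))   # yes, from the pure overcast branch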
