Search
 
SCRIPT & CODE EXAMPLE
 

PYTHON

ID3 algorithm code in Python

import pandas as pd
import math
import numpy as np

# Load the training table; every column except the "answer" target column
# is treated as a candidate splitting attribute.
data = pd.read_csv("3-dataset.csv")
features = list(data.columns)
features.remove("answer")

class Node:
    """A single node of the decision tree.

    A freshly created node is an unlabeled, non-leaf node without children;
    the tree builder fills the attributes in afterwards.
    """

    def __init__(self):
        # Label shown for this node (an attribute name or an attribute value).
        self.value = ""
        # Prediction stored on leaf nodes; left as "" on internal nodes.
        self.pred = ""
        # True only for nodes that carry a prediction.
        self.isLeaf = False
        # Sub-nodes, in insertion order; each instance gets its own list.
        self.children = []

def entropy(examples):
    """Return the binary Shannon entropy (in bits) of the ``answer`` column.

    Rows whose ``answer`` equals ``"yes"`` are counted as positive; every
    other row is counted as negative.

    Args:
        examples: pandas DataFrame holding an ``answer`` column.

    Returns:
        The entropy as a float. ``0.0`` is returned when ``examples`` has no
        rows or when all rows fall into a single class.
    """
    total = len(examples)
    if total == 0:
        # Nothing to count; also avoids touching the column on an empty frame.
        return 0.0

    # Vectorised count instead of a Python-level iterrows() loop.
    pos = int((examples["answer"] == "yes").sum())
    neg = total - pos
    if pos == 0 or neg == 0:
        # A pure set has zero entropy (and log(0) must be avoided).
        return 0.0

    p = pos / total
    n = neg / total
    return -(p * math.log(p, 2) + n * math.log(n, 2))

def info_gain(examples, attr):
    """Return the information gain obtained by splitting ``examples`` on ``attr``.

    The gain is the entropy of ``examples`` minus the size-weighted entropy of
    each subset that shares one distinct value of ``attr``.

    Args:
        examples: pandas DataFrame containing ``attr`` and the ``answer`` column.
        attr: name of the column to split on.

    Returns:
        The information gain as a float.
    """
    total = len(examples)
    column = examples[attr]
    gain = entropy(examples)
    for u in np.unique(column):
        subdata = examples[column == u]
        # Weight each subset's entropy by the fraction of rows it holds.
        gain -= (len(subdata) / total) * entropy(subdata)
    return gain

def ID3(examples, attrs):
    """Build a decision tree for ``examples`` with the ID3 algorithm.

    The attribute with the highest information gain becomes the returned
    node's ``value``. For each distinct value of that attribute a child node
    labeled with the value is added: a leaf holding the prediction when the
    matching rows are pure, otherwise a node whose single child is the subtree
    built recursively from the matching rows and the remaining attributes.

    Args:
        examples: pandas DataFrame containing the columns in ``attrs`` and the
            ``answer`` column.
        attrs: list of column names that may still be used for splitting.

    Returns:
        The root ``Node`` of the (sub)tree. When no attribute yields a
        positive gain (pure data, no attributes left, or contradictory rows)
        a leaf is returned whose ``pred`` holds the most frequent answer(s).
    """
    root = Node()

    # Pick the attribute with the largest strictly positive gain.
    max_gain = 0
    max_feat = None
    for feature in attrs:
        gain = info_gain(examples, feature)
        if gain > max_gain:
            max_gain = gain
            max_feat = feature

    if max_feat is None:
        # Nothing useful to split on: fall back to a majority-vote leaf
        # instead of indexing the frame with a non-existent column.
        root.isLeaf = True
        root.pred = examples["answer"].mode().to_numpy()
        return root

    root.value = max_feat

    # The chosen attribute is not reused further down this branch.
    new_attrs = attrs.copy()
    new_attrs.remove(max_feat)

    for u in np.unique(examples[max_feat]):
        subdata = examples[examples[max_feat] == u]
        if entropy(subdata) == 0.0:
            # Pure subset: terminate the branch with a prediction.
            newNode = Node()
            newNode.isLeaf = True
            newNode.value = u
            newNode.pred = np.unique(subdata["answer"])
            root.children.append(newNode)
        else:
            # Mixed subset: a value node wrapping the recursively built subtree.
            dummyNode = Node()
            dummyNode.value = u
            dummyNode.children.append(ID3(subdata, new_attrs))
            root.children.append(dummyNode)
    return root

def printTree(root: Node, depth=0):
    """Print the tree rooted at ``root`` to stdout, one node per line.

    Each node is indented with one tab per level of ``depth``. Leaf nodes
    additionally show `` -> `` followed by their prediction. Children are
    printed recursively at ``depth + 1``.
    """
    indent = "\t" * depth
    print(indent, end="")
    print(root.value, end="")
    if root.isLeaf:
        print(" -> ", root.pred)
    print()
    for node in root.children:
        printTree(node, depth + 1)

# Build the decision tree from the loaded dataset using every column except
# "answer" as a candidate attribute, then print the tree to stdout.
root = ID3(data, features)
printTree(root)
Comment

PREVIOUS NEXT
Code Example
Python :: pytesseract.image_to_data(img output_type=output.dict) 
Python :: Merge two Querysets in Python Django while preserving Queryset methods 
Python :: how to get one record in django 
Python :: how to make a square in python 
Python :: django not migrating 
Python :: are tuples in python mutable 
Python :: scrapy get text custom tags 
Python :: jupyter notebook bold text 
Python :: python kivy bind 
Python :: python argsort 
Python :: keras name model 
Python :: flask windows auto reload 
Python :: ner spacy 
Python :: return array of sorted objects 
Python :: how to address null in python 
Python :: protected class python 
Python :: protected vs private python 
Python :: package in python 
Python :: counter python time complexity 
Python :: add columns not in place 
Python :: parse_dates 
Python :: get midnight of current day python 
Python :: Python Pandas - How to write in a specific column in an Excel Sheet 
Python :: django venv activate 
Python :: Python Program to Sort Words in Alphabetic Order 
Python :: how to create fastapi 
Python :: python typing 
Python :: keep the user logged in even though user changes password django 
Python :: pandas using eval converter excluding nans 
Python :: set default palette seaborn 
ADD CONTENT
Topic
Content
Source link
Name
4+7 =