# Connect to Google Drive: mount it at /content/drive in the Colab runtime
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive

import numpy as np

from sklearn import tree

from matplotlib import pyplot as plt
# IPython magic (notebook only): render figures inline below the cell
%matplotlib inline
# Apply the 'ggplot' style sheet to the figures drawn below
plt.style.use('ggplot')


# Integer encodings for the categorical features: every label is mapped to
# its position in the ordered tuple it is listed in.

# Type variable
tp = {label: code for code, label in enumerate(('French', 'Thai', 'Italian', 'Burger'))}

# Price variable
price = {label: code for code, label in enumerate(('$', '$$', '$$$'))}

# Wait Estimate
est = {label: code for code, label in enumerate(('0-10', '10-30', '30-60', '>60'))}

# Patrons variable
pat = {label: code for code, label in enumerate(('None', 'Some', 'Full'))}

# Feature matrix: one row per example, one column per attribute.
# Columns 4, 5, 8 and 9 hold the integer codes from the pat / price / tp / est
# dictionaries; the remaining columns are boolean flags.
# The trailing comment on each row is that row's target label (mirrors `y`).
x = np.array([
# Column index:
# 0     1      2     3       4            5             6      7      8              9
# Column name:
# Alt   Bar    Fri    Hun    Pat          Price         Rain   Res    Type           Est
[True,  False, False, True,  pat['Some'], price['$$$'], False, True,  tp['French'],  est['0-10']], # True
[True,  False, False, True,  pat['Full'], price['$'],   False, False, tp['Thai'],    est['30-60']], # False
[False, True,  False, False, pat['Some'], price['$'],   False, False, tp['Burger'],  est['0-10']], # True
[True,  False, True,  True,  pat['Full'], price['$'],   True,  False, tp['Thai'],    est['10-30']], # True
[True,  False, True,  False, pat['Full'], price['$$$'], False, True,  tp['French'],  est['>60']], # False
[False, True,  False, True,  pat['Some'], price['$$'],  True,  True,  tp['Italian'], est['0-10']], # True
[False, True,  False, False, pat['None'], price['$'],   True,  False, tp['Thai'],    est['10-30']], # False
[False, False, False, True,  pat['Some'], price['$$'],  True,  True,  tp['Thai'],    est['0-10']], # True
[False, True,  True,  False, pat['Full'], price['$'],   True,  False, tp['Burger'],  est['>60']], # False
[True,  True,  True,  True,  pat['Full'], price['$$$'], False, True,  tp['Italian'], est['10-30']], # False
[False, False, False, False, pat['None'], price['$'],   False, False, tp['Thai'],    est['0-10']], # False
[True,  True,  True,  True,  pat['Full'], price['$'],   False, False, tp['Burger'],  est['30-60']], # True
])

# Target labels, one per row of `x`, in the same row order
y = np.array([True, False, True, True, False, True, False, True, False, False, False, True])

def entropyfn(pos, neg):
    """Return the binary entropy, in bits, of a two-class split.

    Args:
        pos: Number of positive examples in the split (scalar).
        neg: Number of negative examples in the split (scalar).

    Returns:
        ``-p*log2(p) - q*log2(q)`` where ``p = pos / (pos + neg)`` and
        ``q = neg / (pos + neg)``. A class with a zero count contributes
        nothing to the sum, so a pure split yields ``0.0``. An empty split
        (``pos + neg == 0``) also yields ``0.0`` instead of dividing by zero.
    """
    tot = pos + neg

    # An empty split has no uncertainty; returning early avoids 0 / 0.
    if tot == 0:
        return 0.0

    entropy = 0.0
    for count in (pos, neg):
        # Skip empty classes: log2(0) is undefined and the term's limit is 0.
        if count != 0:
            share = count / tot
            entropy -= share * np.log2(share)

    return entropy

# Fit an entropy-based decision tree (depth capped at 3) on the data above
clf = tree.DecisionTreeClassifier(
    criterion='entropy',
    max_depth=3,
    random_state=0,
).fit(x, y)

# Draw the fitted tree on a dedicated 10x6 figure
fig, ax = plt.subplots(figsize=(10, 6))
out = tree.plot_tree(clf, filled=True, fontsize=10, ax=ax)

# Restyle the connecting arrows: thick red edges
for annotation in out:
    connector = annotation.arrow_patch
    if connector is None:
        # This annotation has no arrow attached, so there is nothing to restyle
        continue
    connector.set_edgecolor('red')
    connector.set_linewidth(3)

plt.show()

# Export this notebook to HTML with nbconvert (IPython `!` shell escape, notebook only)
!jupyter nbconvert --to html "/content/drive/MyDrive/MIT - Data Sciences/Colab Notebooks/Week_Five_-_Classification_and_Hypothesis_Testing/Restaurant_Waiting/Practical_Application_Restaurant_Data.ipynb"

Customers in Restaurants

Objective

Dataset Description

Importing the libraries