Define some functions¶

In [1]:
from sklearn.ensemble import AdaBoostClassifier
from sklearn.tree import DecisionTreeClassifier
from matplotlib.colors import ListedColormap
import matplotlib.pyplot as plt
import numpy as np
import seaborn as sns
import pandas as pd


def AdaBoost_scratch(X, y, M, learning_rate, depth=1):
    # Initialization of utility variables
    N = len(y)
    estimator_list, y_predict_list, estimator_error_list, estimator_weight_list, sample_weight_list = [], [], [], [], []

    # Initialize the sample weights uniformly
    sample_weight = np.ones(N) / N
    sample_weight_list.append(sample_weight.copy())

    # For m = 1 to M
    for m in range(M):

        # Fit a weak classifier on the weighted sample
        estimator = DecisionTreeClassifier(max_depth=depth)
        estimator.fit(X, y, sample_weight=sample_weight)
        y_predict = estimator.predict(X)

        # Misclassifications
        incorrect = (y_predict != y)

        # Weighted estimator error
        estimator_error = np.average(incorrect, weights=sample_weight, axis=0)

        # Estimator (voting) weight
        estimator_weight = learning_rate * np.log((1. - estimator_error) / estimator_error)

        # Boost sample weights: up-weight the misclassified points
        sample_weight *= np.exp(estimator_weight * incorrect * ((sample_weight > 0) | (estimator_weight < 0)))

        # Save iteration values
        estimator_list.append(estimator)
        y_predict_list.append(y_predict.copy())
        estimator_error_list.append(estimator_error)
        estimator_weight_list.append(estimator_weight)
        sample_weight_list.append(sample_weight.copy())

    # Convert to np arrays for convenience
    estimator_list = np.asarray(estimator_list)
    y_predict_list = np.asarray(y_predict_list)
    estimator_error_list = np.asarray(estimator_error_list)
    estimator_weight_list = np.asarray(estimator_weight_list)
    sample_weight_list = np.asarray(sample_weight_list)

    # Final prediction: sign of the weighted vote of all weak classifiers
    preds = np.array([np.sign((y_predict_list[:, point] * estimator_weight_list).sum()) for point in range(N)])

    print('')
    print('Accuracy = ', (preds == y).sum() / N)
    print('')

    return estimator_list, estimator_weight_list, sample_weight_list

def plot_AdaBoost_scratch_boundary(estimators, estimator_weights, X, y, N=10, ax=None):
    '''Utility function to plot the decision boundary and a scatter plot of the data'''

    def AdaBoost_scratch_classify(x_temp, est, est_weights):
        '''Return the classification prediction for a given point x_temp and a previously fitted AdaBoost'''
        temp_pred = np.asarray([(e.predict(x_temp)).T * w for e, w in zip(est, est_weights)]) / est_weights.sum()
        return np.sign(temp_pred.sum(axis=0))

    x_min, x_max = X[:, 0].min() - .1, X[:, 0].max() + .1
    y_min, y_max = X[:, 1].min() - .1, X[:, 1].max() + .1
    xx, yy = np.meshgrid(np.linspace(x_min, x_max, N), np.linspace(y_min, y_max, N))

    # Classify every point on the grid, then reshape the result and plot
    zz = np.array([AdaBoost_scratch_classify(np.array([xi, yi]).reshape(1, -1), estimators, estimator_weights)
                   for xi, yi in zip(np.ravel(xx), np.ravel(yy))])
    Z = zz.reshape(xx.shape)

    cm_bright = ListedColormap(['#FF0000', '#0000FF'])
    if ax is None:
        ax = plt.gca()
    ax.contourf(xx, yy, Z, 2, cmap='RdBu', alpha=.5)
    ax.contour(xx, yy, Z, 2, cmap='RdBu')
    ax.scatter(X[:, 0], X[:, 1], c=y, cmap=cm_bright)
    ax.set_xlabel('$X_1$')
    ax.set_ylabel('$X_2$')
    
def adaboost_steps(df, L=1):
    '''Hand-worked AdaBoost: three fixed stumps, with the sample weights updated after each round.'''
    # Round 1: stump splitting at x2 = 2.5 (predicts +1 when x2 > 2.5)
    df['Stump 1'] = np.sign(df['x2'] - 2.5).astype(int)
    df['Weight 1'] = np.repeat(1 / len(df), len(df))
    e1 = df[df['Stump 1'] * df['y'] == -1]['Weight 1'].sum()
    alpha1 = L * .5 * np.log((1 - e1) / e1)

    df['Weight 2'] = df['Weight 1'] * np.exp(alpha1 * (-df['y'] * df['Stump 1']))
    df['Weight 2'] = df['Weight 2'] / sum(df['Weight 2'])

    # Round 2: stump splitting at x1 = 1.5 (predicts +1 when x1 < 1.5)
    df['Stump 2'] = -np.sign(df['x1'] - 1.5).astype(int)
    e2 = df[df['Stump 2'] * df['y'] == -1]['Weight 2'].sum()
    alpha2 = L * .5 * np.log((1 - e2) / e2)

    df['Weight 3'] = df['Weight 2'] * np.exp(alpha2 * (-df['y'] * df['Stump 2']))
    df['Weight 3'] = df['Weight 3'] / sum(df['Weight 3'])

    # Round 3: stump splitting at x1 = 4.5 (predicts +1 when x1 < 4.5)
    df['Stump 3'] = -np.sign(df['x1'] - 4.5).astype(int)
    e3 = df[df['Stump 3'] * df['y'] == -1]['Weight 3'].sum()
    alpha3 = L * .5 * np.log((1 - e3) / e3)

    print('')
    print('Voting Power of Stump 1:', np.round(alpha1, decimals=4))
    print('Voting Power of Stump 2:', np.round(alpha2, decimals=4))
    print('Voting Power of Stump 3:', np.round(alpha3, decimals=4))
    print('')

    return df
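
For reference, here is a summary (added for clarity) of the update rules that AdaBoost_scratch implements in round $m$, writing $h_m$ for the fitted stump and $w_i$ for the sample weights:

$\varepsilon_m = \sum_i w_i \,[h_m(x_i) \neq y_i] \,/\, \sum_i w_i$   (weighted error)

$\alpha_m = \mathrm{learning\_rate} \cdot \ln\frac{1-\varepsilon_m}{\varepsilon_m}$   (voting power, stored in estimator_weight_list)

$w_i \leftarrow w_i \, e^{\alpha_m [h_m(x_i) \neq y_i]}$   (misclassified points are up-weighted; the weights are left unnormalized, which does not change the fitted stumps here)

$\hat{y}(x) = \mathrm{sign}\big(\sum_m \alpha_m h_m(x)\big)$   (final prediction)

The hand-worked adaboost_steps function uses the classic two-class form $\alpha_m = \frac{L}{2}\ln\frac{1-\varepsilon_m}{\varepsilon_m}$, i.e. half the voting power above for the same error; since the final prediction depends only on the sign of the weighted vote, scaling all the alphas by one half does not change it.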

Define Data¶

In [2]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1])


X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax
#plt.savefig('ada_scatter.png')
Out[2]:
<Axes: xlabel='$X_1$', ylabel='$X_2$'>
[Figure: scatter plot of the data, colored by class]
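
As an optional sanity check (a sketch added here, not one of the original cells), the scratch implementation can be compared against scikit-learn's AdaBoostClassifier with algorithm='SAMME', which for a two-class problem uses the same log((1 - err) / err) estimator-weight rule; the two reported training accuracies can then be compared directly.

# Optional cross-check of AdaBoost_scratch against scikit-learn's SAMME AdaBoost
sk_boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=1),
                              n_estimators=5, learning_rate=1.0, algorithm='SAMME')
sk_boost.fit(X, y)
print('sklearn training accuracy:', sk_boost.score(X, y))

_ = AdaBoost_scratch(X, y, M=5, learning_rate=1.0, depth=1)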

Effect of Number of Rounds¶

Change rounds (the number of boosting rounds) to see the effect

In [4]:
rounds = 1  # number of boosting rounds
L = .1      # learning rate

estimator_list, estimator_weight_list, sample_weight_list = AdaBoost_scratch(X, y, M=rounds, depth=1,
                                                                              learning_rate=L)

plot_AdaBoost_scratch_boundary(estimator_list, estimator_weight_list, X, y, N=50)
Accuracy =  0.8

[Figure: AdaBoost decision boundary with the data overlaid]
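
An optional sketch (not one of the original cells): rather than editing rounds by hand, the same experiment can be looped over several values of M and the printed training accuracies compared.

# Optional sketch: rerun the scratch AdaBoost for several round counts
for m in [1, 3, 5, 10, 20]:
    print('M =', m)
    _ = AdaBoost_scratch(X, y, M=m, learning_rate=0.1, depth=1)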

Effect of Learning Rate¶

Change the learning rate L to see the effect

In [4]:
rounds = 20
L = .1  # learning rate

estimator_list, estimator_weight_list, sample_weight_list = AdaBoost_scratch(X, y, M=rounds, depth=1,
                                                                              learning_rate=L)

plot_AdaBoost_scratch_boundary(estimator_list, estimator_weight_list, X, y, N=50)
Accuracy =  1.0

[Figure: AdaBoost decision boundary with the data overlaid]
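
The cell above increased the number of rounds but kept L = .1. As an optional sketch (not one of the original cells), the learning rate itself can be swept with the scratch implementation at a fixed number of rounds:

# Optional sketch: sweep the learning rate with 20 boosting rounds
for lr in [0.05, 0.1, 0.5, 1.0]:
    print('learning_rate =', lr)
    _ = AdaBoost_scratch(X, y, M=20, learning_rate=lr, depth=1)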
In [8]:
# Collect results in a list, then build the DataFrame once
rows = []
for rs in range(1, 100):
    for lr in [.01, .1, .5]:
        boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=1, max_leaf_nodes=2),
                                   n_estimators=rs, learning_rate=lr)
        boost.fit(X, y)
        rows.append([rs, lr, boost.score(X, y)])

ac = pd.DataFrame(rows, columns=['Rounds', 'Learning Rate', 'Accuracy'])

sns.set()
ax = sns.lineplot(x="Rounds", y="Accuracy", hue=ac['Learning Rate'].astype('category'), data=ac)
[Figure: training accuracy vs. number of rounds, one line per learning rate]
In [6]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1])

X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax

plt.figure()

rows = []
for rs in range(1, 50):
    for lr in [.2, .8, 2]:
        boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=1, max_leaf_nodes=2),
                                   algorithm='SAMME', n_estimators=rs, learning_rate=lr)
        boost.fit(X, y)
        rows.append([rs, lr, boost.score(X, y)])

ac = pd.DataFrame(rows, columns=['Rounds', 'Learning Rate', 'Accuracy'])

sns.set()
ax = sns.lineplot(x="Rounds", y="Accuracy", hue=ac['Learning Rate'].astype('category'), data=ac)
[Figures: scatter plot of the data; training accuracy vs. number of rounds, one line per learning rate]
In [7]:
fig = ax.get_figure()
fig.savefig('learning_rate_vs_accuracy.png')

Another Dataset¶

In [8]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5, 3])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5, 4])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1, -1])

X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax

plt.figure()

rows = []
for rs in range(1, 20):
    for lr in [.2, .8, 2]:
        boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=1, max_leaf_nodes=2),
                                   algorithm='SAMME', n_estimators=rs, learning_rate=lr)
        boost.fit(X, y)
        rows.append([rs, lr, boost.score(X, y)])

ac = pd.DataFrame(rows, columns=['Rounds', 'Learning Rate', 'Accuracy'])

sns.set()
ax = sns.lineplot(x="Rounds", y="Accuracy", hue=ac['Learning Rate'].astype('category'), data=ac)
[Figures: scatter plot of the data; training accuracy vs. number of rounds, one line per learning rate]

Tricky Data to Learn¶

In [9]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5, 1])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5, 5])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1, -1])


X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax

plt.figure()
Out[9]:
<Figure size 640x480 with 0 Axes>
[Figure: scatter plot of the data, colored by class]
In [40]:
rounds = 20
L = 1   # learning rate

estimator_list, estimator_weight_list, sample_weight_list = AdaBoost_scratch(X, y, M=rounds, depth=2,
                                                                              learning_rate=L)

plot_AdaBoost_scratch_boundary(estimator_list, estimator_weight_list, X, y, N=50)
Accuracy =  1.0

[Figure: AdaBoost decision boundary with the data overlaid]

Can AdaBoost completely solve this?¶

In [46]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5, 1])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5, 5])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1, -1])


X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax

plt.figure()

rows = []
for rs in range(1, 100):
    for lr in [.2, 1, 2]:
        boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=2, max_leaf_nodes=3),
                                   algorithm='SAMME', n_estimators=rs, learning_rate=lr)
        boost.fit(X, y)
        rows.append([rs, lr, boost.score(X, y)])

ac = pd.DataFrame(rows, columns=['Rounds', 'Learning Rate', 'Accuracy'])

sns.set()
ax = sns.lineplot(x="Rounds", y="Accuracy", hue=ac['Learning Rate'].astype('category'), data=ac)
[Figures: scatter plot of the data; training accuracy vs. number of rounds, one line per learning rate]
In [45]:
rounds = 20
L = .1  # learning rate

estimator_list, estimator_weight_list, sample_weight_list = AdaBoost_scratch(X, y, M=rounds, depth=2,
                                                                              learning_rate=L)

plot_AdaBoost_scratch_boundary(estimator_list, estimator_weight_list, X, y, N=50)
Accuracy =  1.0

[Figure: AdaBoost decision boundary with the data overlaid]
In [12]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5, 4])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5, 2])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1, 1])


X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax

plt.figure()

rows = []
for rs in range(1, 100):
    for lr in [.2, 1, 2]:
        boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=1, max_leaf_nodes=2),
                                   algorithm='SAMME', n_estimators=rs, learning_rate=lr)
        boost.fit(X, y)
        rows.append([rs, lr, boost.score(X, y)])

ac = pd.DataFrame(rows, columns=['Rounds', 'Learning Rate', 'Accuracy'])

sns.set()
ax = sns.lineplot(x="Rounds", y="Accuracy", hue=ac['Learning Rate'].astype('category'), data=ac)
[Figures: scatter plot of the data; training accuracy vs. number of rounds, one line per learning rate]
In [13]:
x1 = np.array([1, 1, 2, 2, 3, 3, 3, 4, 5, 5, 4])
x2 = np.array([1, 3, 2, 4, 1, 2, 5, 4,   2, 5, 3])
y = np.array([ 1, 1,-1, 1,-1, -1, 1, 1,  -1,-1, 1])


X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

ax = plt.gca()
cm_bright = ListedColormap(['#FF0000', '#0000FF'])
scatter_weights = np.ones(len(y))
ax.scatter(X[:,0],X[:,1], c = y, cmap = cm_bright, s = scatter_weights* 40)

ax.set_xlabel('$X_1$')
ax.set_ylabel('$X_2$')

ax

plt.figure()

rows = []
for rs in range(1, 50):
    for lr in [.05, 1, 2]:
        boost = AdaBoostClassifier(estimator=DecisionTreeClassifier(max_depth=1, max_leaf_nodes=2),
                                   algorithm='SAMME', n_estimators=rs, learning_rate=lr)
        boost.fit(X, y)
        rows.append([rs, lr, boost.score(X, y)])

ac = pd.DataFrame(rows, columns=['Rounds', 'Learning Rate', 'Accuracy'])

sns.set()
ax = sns.lineplot(x="Rounds", y="Accuracy", hue=ac['Learning Rate'].astype('category'), data=ac)
[Figures: scatter plot of the data; training accuracy vs. number of rounds, one line per learning rate]

Calculation¶

In [14]:
adaboost_steps(df, L=1)
Voting Power of Stump 1: 0.752
Voting Power of Stump 2: 0.6264
Voting Power of Stump 3: 1.0601

Out[14]:
    x1  x2  y  Stump 1  Weight 1  Weight 2  Stump 2  Weight 3  Stump 3
0    1   1  1       -1  0.090909  0.250000        1  0.160714        1
1    1   3  1        1  0.090909  0.055556        1  0.035714        1
2    2   2 -1       -1  0.090909  0.055556       -1  0.035714        1
3    2   4  1        1  0.090909  0.055556       -1  0.125000        1
4    3   1 -1       -1  0.090909  0.055556       -1  0.035714        1
5    3   2 -1       -1  0.090909  0.055556       -1  0.035714        1
6    3   5  1        1  0.090909  0.055556       -1  0.125000        1
7    4   4  1        1  0.090909  0.055556       -1  0.125000        1
8    5   2 -1       -1  0.090909  0.055556       -1  0.035714       -1
9    5   5 -1        1  0.090909  0.250000       -1  0.160714       -1
10   4   3  1        1  0.090909  0.055556       -1  0.125000        1
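
To see how these voting powers turn into a final classification, here is a small follow-up sketch (added here, reusing the rounded alpha values printed above) that combines the three stump columns into a weighted vote:

# Weighted majority vote of the three fixed stumps, using the voting powers
# printed in the output above (rounded to 4 decimals)
alphas = np.array([0.752, 0.6264, 1.0601])
stumps = df[['Stump 1', 'Stump 2', 'Stump 3']].to_numpy()
final_pred = np.sign(stumps @ alphas)
print('Ensemble accuracy:', (final_pred == df['y']).mean())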
In [15]:
#Toy Dataset
x1 = np.array([1, 1, 2, 2, 3, 3])
x2 = np.array([2, 1, 4, 5, 1, 2])
y = np.array([ 1, 1,-1, -1,1, -1])
X = np.vstack((x1,x2)).T
df = pd.DataFrame({'x1':x1, 'x2':x2, 'y':y})

adaboost_steps(df, L=1)
Voting Power of Stump 1: -0.8047
Voting Power of Stump 2: 1.0986
Voting Power of Stump 3: 0.226

Out[15]:
   x1  x2  y  Stump 1  Weight 1  Weight 2  Stump 2  Weight 3  Stump 3
0   1   2  1       -1  0.166667       0.1        1  0.055556        1
1   1   1  1       -1  0.166667       0.1        1  0.055556        1
2   2   4 -1        1  0.166667       0.1       -1  0.055556        1
3   2   5 -1        1  0.166667       0.1       -1  0.055556        1
4   3   1  1       -1  0.166667       0.1       -1  0.500000        1
5   3   2 -1       -1  0.166667       0.5       -1  0.277778        1
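
Note the negative voting power for Stump 1 on this toy dataset: its weighted error is above 0.5 (it misclassifies 5 of the 6 equally weighted points), so $\alpha_1 = \frac{L}{2}\ln\frac{1-\varepsilon_1}{\varepsilon_1}$ comes out negative and the ensemble effectively counts that stump's vote in reverse. A quick check of that error (a small sketch added here):

# Weighted error of Stump 1: total weight on the points it misclassifies
# (with equal 1/6 weights this should come out to 5/6, matching alpha1 = -0.8047)
e1 = df.loc[df['Stump 1'] * df['y'] == -1, 'Weight 1'].sum()
print('Stump 1 weighted error:', e1)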