Detail on AdaBoost - Adaptive Boosting¶
Understanding concept of Boosting¶
Boosting is an ensemble learning method aimed at transforming a collection of weak learners into a single, strong predictive model. In boosting, models are trained sequentially rather than concurrently. Each model in the sequence seeks to correct the errors of its predecessor by emphasizing the previously misclassified examples. This iterative strategy reduces both bias and variance, often resulting in a classifier that performs significantly better than any single weak learner alone. Boosting focuses on prediction error, particularly emphasizing the hard-to-classify instances, thereby gradually creating a model that generalizes well.
AdaBoost: Adaptive Boosting¶
AdaBoost, short for Adaptive Boosting, was one of the first practical boosting algorithms and remains foundational in machine learning. It works by assigning equal weights to all training instances at the start and then iteratively increasing the weights of misclassified examples. Subsequent weak classifiers are trained on this reweighted dataset so they concentrate on harder cases. Each weak learner’s contribution to the final prediction is weighted according to its accuracy. Over a number of rounds, this process yields a strong classifier made up of weighted weak learners.
AdaBoost commonly uses decision stumps (single-split decision trees) as its weak learners, but in practice it can also combine stronger base learners, sometimes improving performance further on complex datasets. While it often resists overfitting on clean data, AdaBoost is known to be sensitive to noise and outliers: frequently misclassified points can receive disproportionately high weight and skew the model, though variants exist to mitigate that effect.
The core principle is to allocate more learning power to hard examples by reweighting the data. If a sample is hard to classify, subsequent learners are nudged to correct that mistake. Similarly, each learner’s influence on the final model is dictated by its success rate: better learners should count more. This idea is grounded in exponential loss minimization, where AdaBoost aims to minimize an upper bound of the training error by iteratively reweighting the samples to focus on mistakes. The update rules for weights stem from this formal objective. We will see this in detail with example shortly.
Theoretical Understanding of how AdaBoost works¶
Initial Setup¶
The AdaBoost algorithm starts by assigning equal weights to all training examples. Suppose you have a dataset with $n$ samples. Initially, each sample is given a weight of $1/n$. These weights indicate the importance of each sample during training. At this point, no classifier has been trained and all data points are treated equally.
Iterative Model Training¶
The algorithm proceeds in iterations. In each round, a weak learner (typically a shallow decision tree or a decision stump, which is a one-level decision tree) is trained on the weighted dataset. The model tries to classify the training data, and its performance is evaluated using the current weights. After training, the classifier's predictions are compared to the true labels. If a sample is misclassified, its weight is increased so that the next model in the sequence will pay more attention to this sample. On the other hand, if a sample is correctly classified, its weight is decreased.
This process ensures that the next classifier focuses more on the hard-to-classify data points. The logic is: if a model struggles to classify certain examples, the next model should try harder to get them right.
Classifier Weighting¶
Each weak learner is also assigned a weight based on its accuracy. If the classifier performs well, it receives a higher weight, meaning its influence in the final model will be greater. The accuracy is used to calculate an alpha value (usually denoted as α), which represents the confidence of the classifier. Poorer-performing classifiers receive smaller α values and have less say in the final prediction.
Mathematically, this alpha is calculated using:
$$ \alpha_t = \frac{1}{2} \ln\left(\frac{1 - \epsilon_t}{\epsilon_t}\right) $$
where $\epsilon_t$ is the error rate of the weak classifier at iteration $t$. A lower error rate leads to a higher alpha, meaning the model is more trusted in the ensemble.
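To make the mapping from error rate to classifier weight concrete, here is a minimal sketch (the error values are arbitrary); a lower $\epsilon_t$ yields a larger $\alpha_t$:
import numpy as np

# Hypothetical weighted error rates of three weak learners
eps = np.array([0.3, 0.1, 0.45])

# alpha_t = 0.5 * ln((1 - eps_t) / eps_t)
alphas = 0.5 * np.log((1 - eps) / eps)
print(np.round(alphas, 4))  # [0.4236 1.0986 0.1003]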
Weight Update for Data Points¶
Once a classifier is trained and its alpha is computed, the weights of the data points are updated for the next iteration. Misclassified samples get their weights increased, making them more influential for the next classifier, while correctly classified ones have their weights decreased. With labels and predictions in $\{-1, +1\}$, the update can be written as:
$$ w_i^{(t+1)} = w_i^{(t)} \cdot \exp\left(-\alpha_t \, y_i \, h_t(x_i)\right) $$
Since $y_i h_t(x_i) = +1$ for a correct prediction and $-1$ for an incorrect one, correct samples are scaled by $e^{-\alpha_t}$ and incorrect ones by $e^{+\alpha_t}$. (An equivalent formulation multiplies only the misclassified samples by $\exp(\alpha_t \cdot \mathbb{I}[y_i \neq h_t(x_i)])$; after normalization both give the same distribution.) Finally, all weights are normalized so that they sum up to 1.
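A minimal sketch of one such update, assuming 10 samples of which samples 3, 7, and 10 are misclassified (the same setup used in the worked example later in this article):
import numpy as np

n = 10
w = np.full(n, 1 / n)                            # initial weights 1/n
miss = np.isin(np.arange(1, n + 1), [3, 7, 10])  # True where the stump is wrong

eps = w[miss].sum()                              # weighted error = 0.3
alpha = 0.5 * np.log((1 - eps) / eps)            # ~0.4236

w = w * np.exp(np.where(miss, alpha, -alpha))    # up-weight mistakes, down-weight the rest
w = w / w.sum()                                  # renormalize to sum to 1
print(np.round(w, 4))                            # correct ~0.0714, misclassified ~0.1667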
Repeating the Process¶
The training continues for a predefined number of rounds (or until the error drops to zero). In each iteration, a new weak learner is added, focusing more on the difficult examples as defined by the updated weights. As the iterations proceed, the ensemble becomes increasingly accurate.
Final Prediction¶
To make a prediction on a new sample, AdaBoost takes the predictions from all weak learners and performs a weighted vote, where the weight of each model is its alpha value. In binary classification, if the weighted sum of predictions is positive, the sample is classified into class 1; otherwise, class 0.
Mathematically, the final strong classifier $H(x)$ is:
$$ H(x) = \text{sign}\left( \sum_{t=1}^{T} \alpha_t \cdot h_t(x) \right) $$
Here, $h_t(x)$ is the prediction of the t-th weak learner, and $\alpha_t$ is its corresponding weight. The final result is the sign of the weighted sum of individual classifiers’ outputs.
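To tie the whole procedure together, here is a compact from-scratch sketch of training and prediction, using scikit-learn decision stumps as weak learners and labels in {-1, +1}. The function names (adaboost_fit, adaboost_predict) are illustrative, not library APIs:
import numpy as np
from sklearn.tree import DecisionTreeClassifier
from sklearn.datasets import make_classification

def adaboost_fit(X, y, T=20):
    """Train T decision stumps with AdaBoost-style reweighting (labels in {-1, +1})."""
    n = len(y)
    w = np.full(n, 1 / n)
    stumps, alphas = [], []
    for _ in range(T):
        stump = DecisionTreeClassifier(max_depth=1)
        stump.fit(X, y, sample_weight=w)                      # weak learner trained on weighted data
        pred = stump.predict(X)
        eps = np.clip(w[pred != y].sum(), 1e-10, 1 - 1e-10)   # weighted error
        alpha = 0.5 * np.log((1 - eps) / eps)                 # learner weight (a full version would stop if eps >= 0.5)
        w = w * np.exp(-alpha * y * pred)                     # up-weight mistakes, down-weight the rest
        w = w / w.sum()
        stumps.append(stump)
        alphas.append(alpha)
    return stumps, alphas

def adaboost_predict(stumps, alphas, X):
    """Weighted vote: sign of sum_t alpha_t * h_t(x)."""
    votes = sum(a * s.predict(X) for s, a in zip(stumps, alphas))
    return np.sign(votes)

X, y = make_classification(n_samples=200, n_features=6, random_state=0)
y = np.where(y == 0, -1, 1)   # AdaBoost's formulation uses {-1, +1} labels
stumps, alphas = adaboost_fit(X, y)
print("Training accuracy:", (adaboost_predict(stumps, alphas, X) == y).mean())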
Importance of Features in AdaBoost¶
AdaBoost is often explained in terms of reweighting data points, but that leads to a common misconception - that it ignores the features. In reality, features are central to how weak learners are trained. Let’s break it down clearly using an example with multiple features and then extend it to multi-class classification.
In AdaBoost, a weak learner (commonly a decision stump) is trained to minimize the weighted classification error. A decision stump is simply a one-level decision tree: it picks one feature and a threshold, and splits the data into two groups based on that. But unlike in regular decision trees where all data points are treated equally, in AdaBoost, each data point has a weight. Initially, all samples have equal weights, but those weights will later be adjusted based on the errors made in this first round.
Suppose we have:
- 20 samples
- 6 features: F1, F2, F3, F4, F5, F6
- 1 binary target variable: Y (0 or 1)
- All sample weights: $w_i = \frac{1}{20} = 0.05$
The training goal is to build a decision stump that, given these weights, splits the data with lowest weighted classification error. For each of the 6 features, the algorithm tests various threshold values (based on unique values in that feature). For every potential split, the model checks how the data would be classified - whether each sample falls into the predicted class or not. It then computes the total error as the sum of weights of misclassified samples.
Suppose F3 < 5.2 is one candidate split. After applying this split:
- 14 samples are correctly classified
- 6 samples are misclassified
Since each sample has a weight of 0.05:
$$ \varepsilon = \sum_{\text{misclassified}} w_i = 6 \times 0.05 = 0.3 $$
So, the weighted classification error of this stump is 0.3.
The algorithm repeats this for all possible thresholds across all 6 features. Among all these candidates, the decision stump with the lowest weighted error is selected as the first weak learner. Let's say that F3 < 5.2 results in the lowest error (0.3), compared to other splits like F1 < 2.1 (0.35), F5 < 7.4 (0.4), etc. Therefore, the algorithm selects F3 < 5.2 as the first weak hypothesis $h_1(x)$.
The key property of a decision stump is that it only uses one feature to make a decision. The strength of AdaBoost lies in combining many such weak learners that are each simple, but together form a strong model.
What Happens to Features?¶
- No explicit reweighting of features happens.
- But over iterations, as sample weights change, the importance of different features may emerge.
- If a feature helps classify the newly emphasized (previously misclassified) samples, it is likely to be chosen in subsequent rounds.
So, AdaBoost builds a sequence of weak learners, each focusing on a different aspect of the data, possibly using different features at each round.
After training:
- You can evaluate feature importance by checking how often and how effectively each feature was used in decision stumps.
- Libraries like scikit-learn provide .feature_importances_ for this.
Thus, although AdaBoost reweights samples, it leads to implicit feature selection over time.
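For instance, a fitted AdaBoostClassifier exposes aggregated importances directly. A small sketch on synthetic data (the dataset and column names are made up for illustration):
import pandas as pd
from sklearn.ensemble import AdaBoostClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.datasets import make_classification

# Synthetic data with 6 features, only some of them informative
X, y = make_classification(n_samples=200, n_features=6, n_informative=3, random_state=0)
X = pd.DataFrame(X, columns=[f'F{i+1}' for i in range(6)])

clf = AdaBoostClassifier(DecisionTreeClassifier(max_depth=1), n_estimators=50, random_state=0)
clf.fit(X, y)

# Importance of each feature aggregated across all stumps
print(pd.Series(clf.feature_importances_, index=X.columns).sort_values(ascending=False))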
Python Example explaining the scenario¶
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.tree import DecisionTreeClassifier

# Simulate dataset with 20 samples, 6 features, and binary target
np.random.seed(42)
X = pd.DataFrame(np.random.randn(20, 6), columns=[f'F{i+1}' for i in range(6)])
y = np.random.choice([0, 1], size=20)
sample_weights = np.ones(len(y)) / len(y)  # Equal initial weights

# Train decision stumps on each feature and record weighted errors
errors = {}
thresholds = {}

for feature in X.columns:
    min_error = float('inf')
    best_thresh = None
    # Try different thresholds based on unique values in feature
    for thresh in np.unique(X[feature]):
        # Predict using threshold rule
        preds = (X[feature] < thresh).astype(int)  # classify 1 if value < threshold
        incorrect = (preds != y)
        weighted_error = np.sum(sample_weights * incorrect)
        if weighted_error < min_error:
            min_error = weighted_error
            best_thresh = thresh
    errors[feature] = min_error
    thresholds[feature] = best_thresh

# Find best feature-threshold combination
best_feature = min(errors, key=errors.get)
best_thresh = thresholds[best_feature]
best_error = errors[best_feature]

# Visualization
fig, ax = plt.subplots(figsize=(10, 5))
ax.bar(errors.keys(), errors.values(), color='skyblue')
ax.set_title("Weighted Classification Errors for Decision Stumps")
ax.set_ylabel("Weighted Error")
ax.axhline(best_error, color='red', linestyle='--', label=f"Best Split: {best_feature} < {best_thresh:.2f}")
ax.legend()

best_feature, best_thresh, best_error
('F3', -1.1063349740060282, 0.35)
What Changes in Multiclass Classification?¶
AdaBoost was originally designed for binary classification. However, it has been extended to handle multiclass problems in several ways:
1. One-vs-All AdaBoost (OVA)¶
You train one AdaBoost classifier per class. Each classifier predicts whether the sample belongs to that class or not.
- Features are treated the same.
- Each classifier may prioritize different features, based on what best distinguishes its class from the rest.
- At prediction time, you run all classifiers and choose the one with the highest confidence score.
2. SAMME (Stagewise Additive Modeling using a Multiclass Exponential loss function)¶
This is a native multiclass extension of AdaBoost proposed by Zhu et al.
Each weak learner outputs class predictions (not just binary).
The model weight $\alpha_t$ is adjusted for multiclass using:
$$ \alpha_t = \ln\left(\frac{1 - \varepsilon_t}{\varepsilon_t}\right) + \ln(K - 1) $$
where $K$ is the number of classes.
Misclassified samples get higher weights as usual.
The final prediction is based on a weighted vote over class predictions.
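The only change to the learner-weight formula is the $\ln(K-1)$ term, which keeps $\alpha_t$ positive as long as the weak learner beats random guessing (accuracy above $1/K$). A quick sketch with arbitrary error values:
import numpy as np

def samme_alpha(eps, K):
    # Learner weight with the multiclass correction term ln(K - 1)
    return np.log((1 - eps) / eps) + np.log(K - 1)

print(round(samme_alpha(0.3, 2), 4))  # 0.8473 -> exactly twice the binary AdaBoost alpha
print(round(samme_alpha(0.6, 3), 4))  # 0.2877 -> still positive, since random accuracy for K=3 is only 1/3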
3. SAMME.R (Real variant)¶
This is an improvement over SAMME. Instead of using class labels as weak outputs, it uses class probability estimates from weak learners.
- Final prediction combines class probability scores weighted by $\alpha_t$
- This leads to smoother decision boundaries and better accuracy.
Example: Multiclass with 3 Classes and 6 Features¶
Suppose you have a dataset:
- 6 features:
F1
toF6
- Target:
Y
with 3 classes —A
,B
, andC
- 20 data points
Training with SAMME:¶
- In each iteration, a weak learner is trained.
- The learner tries different splits using features.
- Based on weighted error over 3-class predictions, a feature is selected.
- Misclassified samples (in any class) get higher weights.
Here again, features influence the learning, but the error calculation and vote aggregation are adjusted for multiclass.
Over time, the model may find that F2 is useful for distinguishing A from B, while F5 is good at separating B and C. This emerges through the adaptive training process.
Hyperparameters of AdaBoost¶
AdaBoost has a few important hyperparameters that control its behavior. Tuning them can help improve performance on a given task.
1. n_estimators¶
This determines the number of weak learners (e.g., decision stumps) to be used in the ensemble. A higher value means more models will be trained, often leading to better performance, but also longer training time and risk of overfitting on noisy data.
2. learning_rate¶
This shrinks the contribution of each classifier by a constant factor. A lower learning rate means the model learns more slowly, but can achieve better generalization when used with more estimators. In scikit-learn, the default is 1.0. It acts as a regularization mechanism.
3. estimator¶
This is the weak learner used in the boosting process. Typically, a decision stump is used, but it can be replaced with more complex models like deeper decision trees. However, using complex models may reduce the benefit of boosting and increase the chance of overfitting. In older scikit-learn versions this parameter was called base_estimator.
4. algorithm¶
scikit-learn offers two options for this parameter:
- "SAMME": Uses class labels, and works for both binary and multi-class classification.
- "SAMME.R": Uses class probabilities and usually performs better, but requires base learners that provide probability estimates (like decision trees). This option is deprecated in recent scikit-learn versions and is expected to be removed.
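As a quick sketch, these options map directly onto the AdaBoostClassifier constructor, assuming a recent scikit-learn (≥ 1.2, where the base learner is passed as estimator); the values below are arbitrary starting points, not recommendations:
from sklearn.ensemble import AdaBoostClassifier
from sklearn.tree import DecisionTreeClassifier

clf = AdaBoostClassifier(
    estimator=DecisionTreeClassifier(max_depth=1),  # the weak learner (a decision stump here)
    n_estimators=200,                               # number of boosting rounds
    learning_rate=0.5,                              # shrinks each learner's contribution
    algorithm='SAMME',                              # label-based updates; 'SAMME.R' is deprecated
    random_state=42,
)
# A common tuning pattern: increase n_estimators while lowering learning_rate,
# then keep the combination with the best cross-validated score.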
Pros and Cons of AdaBoost¶
Pros¶
- Simple and Effective: AdaBoost is easy to understand and implement. It works well out-of-the-box for many classification problems.
- Reduces Bias and Variance: Since it builds sequential models focused on correcting previous errors, it reduces both bias and variance under many scenarios.
- Less Prone to Overfitting (with proper tuning): Unlike decision trees that can overfit on training data, AdaBoost with simple weak learners often generalizes better.
- Versatile: Can be used with different base learners, though typically shallow trees work best.
Cons¶
- Sensitive to Noisy Data and Outliers: Since AdaBoost increases the weight of misclassified points, noisy data or mislabeled examples can dominate the learning process and degrade performance.
- Computationally Expensive: As the number of estimators increases, training time increases linearly. Moreover, predictions can be slower compared to single models.
- Binary Focused: While extensions exist for multi-class problems, AdaBoost was originally designed for binary classification, and multi-class tasks may require adaptations.
- Harder to Interpret: Unlike a single decision tree, AdaBoost’s ensemble structure is more difficult to interpret and explain.
When to Use AdaBoost¶
AdaBoost is most suitable in scenarios where:
- The data is relatively clean, with minimal outliers.
- The features are structured (e.g., tabular data).
- A fast and simple baseline model is needed before exploring more complex boosting algorithms.
- The problem is binary classification, although it can be extended to multi-class.
It is less ideal in the following cases:
- Datasets with significant noise or mislabeled points.
- Large-scale datasets where computational cost becomes a concern.
- Problems with highly complex feature interactions where deeper tree-based models are more appropriate.
Why Other Boosting Methods Exist¶
Even though AdaBoost was the first popular boosting algorithm and performs well in many cases, it has limitations that later algorithms sought to overcome.
Gradient Boosting¶
Unlike AdaBoost, which reweights samples based on misclassification, Gradient Boosting takes a different route. It fits each new learner to the residual errors of the previous model by minimizing a loss function using gradient descent. This allows more flexibility in handling different types of problems, including regression and classification, and in using custom loss functions.
XGBoost¶
XGBoost (Extreme Gradient Boosting) improves over classic Gradient Boosting by introducing:
- Regularization to avoid overfitting.
- Parallel computation for faster training.
- Tree pruning and histogram-based splits for performance.
- Better handling of sparse and missing data.
XGBoost is widely used in Kaggle competitions and real-world applications because of its robustness and performance.
LightGBM¶
LightGBM is designed for speed and scale:
- Uses a leaf-wise tree growth strategy, which tends to yield better accuracy.
- Efficient with large datasets and high-dimensional data.
- Supports GPU training and efficient handling of categorical variables.
CatBoost¶
CatBoost is specifically tailored for datasets with many categorical features:
- Automatically handles categorical variables without preprocessing.
- Uses ordered boosting to avoid overfitting.
- Produces symmetric trees for faster inference.
Intuition Behind the Formulation of AdaBoost¶
The key idea behind AdaBoost is to focus learning on the hard examples. In traditional supervised learning, every data point is treated equally, and the model tries to minimize overall error. But some examples are inherently more difficult to classify than others.
The Question AdaBoost Answers:¶
Can we build a strong learner by combining many weak learners, each of which only does slightly better than random guessing?
This idea was formalized by Freund and Schapire in 1996, where they showed that even weak hypotheses (slightly better than 50% accuracy) could be combined into a strong hypothesis with arbitrarily low error.
Here’s the intuition:
- Start with equal attention to all data.
- After training one weak model, examine its mistakes.
- Increase attention (weights) on the mistakes, so that the next model tries harder to fix them.
- Keep combining new learners, where each one is focusing more and more on what the previous ones got wrong.
- Use a weighted vote to combine all the learners, giving more importance to models that did well.
The formulation uses exponential loss to increase penalties on misclassified points, which allows the algorithm to tightly focus on hard examples and reduce training error quickly. This approach is both greedy and intuitive - fix what's wrong, give more credit to what's right, and repeat.
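A compact way to see this formally: AdaBoost can be read as greedily minimizing the exponential loss of the combined model $F_T(x) = \sum_{t=1}^{T} \alpha_t h_t(x)$,
$$ L = \sum_{i=1}^{n} \exp\left(-y_i F_T(x_i)\right) $$
At round $t$, the loss accumulated by the ensemble built so far shows up as the sample weights, $w_i^{(t)} \propto \exp\left(-y_i F_{t-1}(x_i)\right)$: points the current ensemble gets badly wrong carry large weight. Choosing $h_t$ to minimize the weighted error and setting $\alpha_t = \frac{1}{2}\ln\frac{1-\epsilon_t}{\epsilon_t}$ is exactly the greedy step that reduces this loss the most at each round.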
Explaining AdaBoost with Example¶
We’ll work with a binary classification task having 10 samples and 3 rounds (T=3) of AdaBoost using decision stumps.
Step 0: Initial Setup¶
Each sample is assigned an equal weight initially:
$$ w_i^{(0)} = \frac{1}{10} = 0.1 \quad \text{for } i = 1 \text{ to } 10 $$
Round 1¶
Train First Weak Learner (h₁)¶
- Misclassified samples: 3, 7, 10
- Error:
$$ \varepsilon_1 = w_3 + w_7 + w_{10} = 0.1 + 0.1 + 0.1 = 0.3 $$
Compute Learner Weight (α₁)¶
$$ \alpha_1 = \frac{1}{2} \ln \left( \frac{1 - \varepsilon_1}{\varepsilon_1} \right) = \frac{1}{2} \ln \left( \frac{0.7}{0.3} \right) \approx 0.4236 $$
Update Weights¶
- Correct samples (weight down):
$$ w_i^{\text{new}} = 0.1 \cdot e^{-0.4236} \approx 0.0655 $$
- Incorrect samples (weight up):
$$ w_i^{\text{new}} = 0.1 \cdot e^{+0.4236} \approx 0.1527 $$
Normalize Weights¶
$$ Z_1 = 7 \cdot 0.0655 + 3 \cdot 0.1527 = 0.9166 $$
- Correct:
$$ w_i^{(1)} = \frac{0.0655}{0.9166} \approx 0.0715 $$
- Incorrect:
$$ w_i^{(1)} = \frac{0.1527}{0.9166} \approx 0.1666 $$
Updated Weights After Round 1¶
Sample | Misclassified | Weight w₁ |
---|---|---|
1 | No | 0.0715 |
2 | No | 0.0715 |
3 | Yes | 0.1666 |
4 | No | 0.0715 |
5 | No | 0.0715 |
6 | No | 0.0715 |
7 | Yes | 0.1666 |
8 | No | 0.0715 |
9 | No | 0.0715 |
10 | Yes | 0.1666 |
Round 2¶
Train Second Weak Learner (h₂)¶
Suppose this time the second stump misclassifies samples 2 and 5 (both were classified correctly in round 1). The weighted error is then:
$$ \varepsilon_2 = w_2 + w_5 = 0.0715 + 0.0715 = 0.1430 $$
Compute Learner Weight (α₂)¶
$$ \alpha_2 = \frac{1}{2} \ln \left( \frac{1 - 0.1430}{0.1430} \right) = \frac{1}{2} \ln(5.996) \approx 0.8959 $$
Update Weights¶
- Correct:
$$ w_i^{\text{new}} = w_i \cdot e^{-\alpha_2} \approx w_i \cdot 0.408 $$
- Incorrect (samples 2, 5):
$$ w_i^{\text{new}} = w_i \cdot e^{+\alpha_2} \approx w_i \cdot 2.45 $$
Calculate Unnormalized Weights¶
Sample | Correct? | w₁ | New w₂ (before normalization) |
---|---|---|---|
1 | Yes | 0.0715 | 0.0715 × 0.408 ≈ 0.0292 |
2 | No | 0.0715 | 0.0715 × 2.45 ≈ 0.1752 |
3 | Yes | 0.1666 | 0.1666 × 0.408 ≈ 0.0680 |
4 | Yes | 0.0715 | 0.0715 × 0.408 ≈ 0.0292 |
5 | No | 0.0715 | 0.0715 × 2.45 ≈ 0.1752 |
6 | Yes | 0.0715 | 0.0715 × 0.408 ≈ 0.0292 |
7 | Yes | 0.1666 | 0.1666 × 0.408 ≈ 0.0680 |
8 | Yes | 0.0715 | 0.0715 × 0.408 ≈ 0.0292 |
9 | Yes | 0.0715 | 0.0715 × 0.408 ≈ 0.0292 |
10 | Yes | 0.1666 | 0.1666 × 0.408 ≈ 0.0680 |
Total sum (Z₂) ≈ 0.7004. Normalized weights are:
- For samples 2 and 5:
$$ \frac{0.1752}{0.7004} ≈ 0.2501 $$
- For others:
$$ \frac{0.0292}{0.7004} ≈ 0.0417 \text{ (for 1, 4, 6, 8, 9)} $$
$$ \frac{0.0680}{0.7004} ≈ 0.0971 \text{ (for 3, 7, 10)} $$
Round 3¶
Let’s assume third stump misclassifies samples 3, 6
$$ \varepsilon_3 = w_3 + w_6 = 0.0971 + 0.0417 = 0.1388 $$
$$ \alpha_3 = \frac{1}{2} \ln \left( \frac{1 - 0.1388}{0.1388} \right) \approx 0.9127 $$
Weights are updated again in similar fashion.
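The rounds above can be reproduced with a few lines of NumPy, which is a convenient way to check the arithmetic (tiny last-digit differences versus the hand-rounded values above are rounding artifacts):
import numpy as np

n = 10
w = np.full(n, 1 / n)
alphas = []

# Samples misclassified by each weak learner (1-indexed, as in the walkthrough)
misclassified_per_round = [[3, 7, 10], [2, 5], [3, 6]]

for missed in misclassified_per_round:
    miss = np.isin(np.arange(1, n + 1), missed)
    eps = w[miss].sum()                            # weighted error
    alpha = 0.5 * np.log((1 - eps) / eps)          # learner weight
    w = w * np.exp(np.where(miss, alpha, -alpha))  # up-weight mistakes, down-weight the rest
    w = w / w.sum()                                # renormalize
    alphas.append(alpha)
    print(f"eps={eps:.4f}, alpha={alpha:.4f}")

# Final vote for a new point where h1 = +1, h2 = +1, h3 = -1
print(np.sign(alphas[0] + alphas[1] - alphas[2]))  # +1.0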
Final Prediction¶
Let’s say we want to predict a new point x. Each weak learner gives:
- h₁(x) = +1
- h₂(x) = +1
- h₃(x) = -1
In AdaBoost, each weak learner $h_t(x)$ makes a prediction for a given input $x$. These predictions are assumed to be in the form of +1 or -1, not 1 or 0, because AdaBoost is originally formulated for binary classification with labels in $\{-1, +1\}$, not $\{0, 1\}$.
So:
- $h_1(x) = +1$ means weak learner 1 predicts class +1 for input $x$
- $h_3(x) = -1$ means weak learner 3 predicts class -1 for input $x$
These signs come directly from how each weak learner classifies the input in AdaBoost's formulation. The final prediction is then:
$$ \hat{y}(x) = \text{sign} \left( \sum_{t=1}^{T} \alpha_t h_t(x) \right) $$
This means:
- Each learner votes with a weight $\alpha_t$
- The sign of the total weighted vote determines the final class (+1 or -1)
Final prediction is:
$$ \hat{y}(x) = \text{sign} \left( \alpha_1 h_1(x) + \alpha_2 h_2(x) + \alpha_3 h_3(x) \right) $$
$$ \hat{y}(x) = \text{sign} (0.4236 \cdot 1 + 0.8959 \cdot 1 + 0.9127 \cdot (-1)) = \text{sign}(0.4068) = +1 $$
So, the final predicted class is +1.
Python Example¶
import numpy as np
import matplotlib.pyplot as plt

# Define 10 data points with initial weights
n_samples = 10
initial_weight = 1 / n_samples
weights = np.full(n_samples, initial_weight)

# Assume the true labels and predictions of weak learners
true_labels = np.array([1, 1, -1, 1, -1, 1, -1, 1, 1, -1])  # Labels in {-1, +1}

# Predictions by each weak learner
h1_pred = np.array([1, 1, 1, 1, -1, 1, 1, 1, 1, -1])
h2_pred = np.array([1, 1, -1, 1, -1, 1, -1, 1, 1, -1])
h3_pred = np.array([-1, -1, -1, 1, -1, 1, -1, 1, 1, -1])

# Assume error rates for each learner
errors = np.array([0.3, 0.2, 0.25])
alphas = 0.5 * np.log((1 - errors) / errors)

# Compute final prediction
def final_prediction(x1, x2, x3, a1, a2, a3):
    vote = a1 * x1 + a2 * x2 + a3 * x3
    return np.sign(vote), vote

# Compute predictions and weighted votes
final_preds = []
weighted_votes = []
for i in range(n_samples):
    pred, vote = final_prediction(h1_pred[i], h2_pred[i], h3_pred[i], alphas[0], alphas[1], alphas[2])
    final_preds.append(pred)
    weighted_votes.append(vote)

# Visualize
plt.figure(figsize=(10, 6))
colors = ['green' if p == 1 else 'red' for p in final_preds]
plt.bar(range(1, n_samples+1), weighted_votes, color=colors)
plt.axhline(0, color='black', linestyle='--')
plt.xlabel('Sample Index')
plt.ylabel('Weighted Vote')
plt.title('Final AdaBoost Prediction (Green = +1, Red = -1)')
plt.show()

final_preds
[1.0, 1.0, -1.0, 1.0, -1.0, 1.0, -1.0, 1.0, 1.0, -1.0]
Variants of AdaBoost¶
Let's check some of the variants of AdaBoost now.
Discrete AdaBoost¶
This is the original version, where each weak learner outputs a class label (not a probability) and sample weights are updated based on misclassification. It is what scikit-learn's AdaBoostClassifier implements when algorithm='SAMME' is used on a binary problem.
from sklearn.ensemble import AdaBoostClassifier
from sklearn.tree import DecisionTreeClassifier
clf = AdaBoostClassifier(
    DecisionTreeClassifier(max_depth=1),
    n_estimators=50,
    algorithm='SAMME',
    learning_rate=1.0
)
clf.fit(X_train, y_train)
Here each stump’s vote is weighted by its accuracy; sample weights are adjusted iteratively based on misclassifications.
LogitBoost¶
LogitBoost is derived by minimizing the logistic loss (log‑likelihood), aligning boosting with logistic regression. It chooses base learners to approximate a Newton step for logistic loss, making the model robust in probabilistic terms.
You can use a lightweight implementation available via pip:
pip install logitboost
from logitboost import LogitBoost
clf = LogitBoost(n_estimators=50)
clf.fit(X_train, y_train)
# Supports both binary and multiclass
In LogitBoost, the base learner acts as a regression stump that fits the pseudo-residuals (working responses) rather than the class labels.
SAMME / SAMME.R for Multiclass¶
While AdaBoost was designed for binary classification, SAMME (Stagewise Additive Modeling using a Multi-class Exponential loss) extends it to multiclass tasks. It adds a correction term log(K−1) to the estimator weight to ensure convergence as long as a weak learner exceeds random accuracy (>1/K), rather than the 50% required for two classes.
- SAMME uses class labels.
- SAMME.R uses probabilities and generalizes Real AdaBoost to multiclass.
clf = AdaBoostClassifier(
    estimator=DecisionTreeClassifier(max_depth=1),
    n_estimators=50,
    algorithm='SAMME.R'  # deprecated in recent scikit-learn; kept here to illustrate the variant
)
clf.fit(X_train, y_train)  # where y_train has >2 classes
This yields smoother, probabilistic updates and often better multiclass performance.
Coding AdaBoost Classifier¶
from sklearn.ensemble import AdaBoostClassifier
from sklearn.tree import DecisionTreeClassifier
from sklearn.datasets import make_classification
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt
import numpy as np
# Create toy dataset
X, y = make_classification(n_samples=100, n_features=2, n_informative=2,
                           n_redundant=0, n_clusters_per_class=1, random_state=42)
y = np.where(y == 0, -1, 1)  # AdaBoost often assumes -1, 1

clf = AdaBoostClassifier(DecisionTreeClassifier(max_depth=1),
                         n_estimators=10, learning_rate=1.0, algorithm='SAMME')
clf.fit(X, y)
AdaBoostClassifier(algorithm='SAMME', estimator=DecisionTreeClassifier(max_depth=1), n_estimators=10)
def plot_boundary(model, X, y):
    x_min, x_max = X[:, 0].min() - 1, X[:, 0].max() + 1
    y_min, y_max = X[:, 1].min() - 1, X[:, 1].max() + 1
    xx, yy = np.meshgrid(np.linspace(x_min, x_max, 500),
                         np.linspace(y_min, y_max, 500))
    Z = model.predict(np.c_[xx.ravel(), yy.ravel()])
    Z = Z.reshape(xx.shape)
    plt.figure(figsize=(8, 6))
    plt.contourf(xx, yy, Z, alpha=0.3)
    plt.scatter(X[:, 0], X[:, 1], c=y, cmap='bwr', edgecolor='k')
    plt.title("AdaBoost Decision Boundary")
    plt.xlabel("Feature 1")
    plt.ylabel("Feature 2")
    plt.show()

plot_boundary(clf, X, y)
Coding AdaBoost with different Base Learner¶
from sklearn.ensemble import AdaBoostClassifier
from sklearn.svm import SVC
from sklearn.datasets import load_wine
from sklearn import metrics
datasets = load_wine()
inputs, targets = datasets.data, datasets.target
targets
array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2])
svc = SVC(probability=True, kernel='linear')
# Create an AdaBoost classifier object with SVC as the base learner
abc = AdaBoostClassifier(n_estimators=50, estimator=svc, learning_rate=1, algorithm='SAMME')
from sklearn.model_selection import train_test_split
x_train, x_test, y_train, y_test = train_test_split(inputs, targets, test_size=0.1, random_state=42, stratify=targets)
model = abc.fit(x_train, y_train)
y_pred = model.predict(x_test)
print("Accuracy:",metrics.accuracy_score(y_test, y_pred))
Accuracy: 0.9444444444444444