Introduction to KNN¶

K-Nearest Neighbors (KNN) is a simple yet powerful algorithm that excels at identifying patterns within data, particularly when it comes to detecting anomalies or outliers. Because KNN compares new data points to their closest neighbors in the feature space, it is especially effective at flagging samples that deviate from typical patterns, making it a common choice for outlier detection.

Beyond anomaly detection, KNN is widely used for both classification and regression tasks. In classification, KNN can group items based on similarity in their features, which makes it particularly useful in applications such as text mining, where documents with similar word patterns can be clustered together. For regression, KNN is well-suited to problems where the relationship between features and the target variable is non-linear, as it makes no assumptions about the underlying data distribution.

One of the biggest advantages of KNN is its intuitiveness. It is easy to understand and interpret, which makes it a strong candidate for initial modeling and exploratory analysis. In fact, in certain scenarios, especially with smaller datasets and well-separated classes, KNN can outperform more complex machine learning models.

The K in KNN refers to the number of nearest neighbors the algorithm considers when making a prediction. To understand this better, imagine trying to decide which movie to watch next. You might ask a few of your friends - say, 5 of them - for recommendations. If 3 out of those 5 suggest a comedy, you’re likely to choose a comedy yourself. Here, K = 5. If you had asked only 1 friend (K = 1), your decision would rely entirely on their preference. Similarly, increasing the value of K makes the model more generalized by considering more neighbors, while a smaller K makes it more sensitive to noise in the data.

Overall, KNN remains a go-to algorithm due to its simplicity, versatility, and effectiveness in a range of real-world applications. However, it can be computationally expensive for large datasets, as it requires calculating distances to all training points for each prediction.


Distance Metric used in KNN¶

At the heart of the KNN algorithm is distance measurement, a way to evaluate how "close" two data points are. This concept is essential because KNN uses these distances to decide which neighbors influence a prediction.

Let's first understand how distances are calculated in 2D space using Minkowski distance, then extend it to other metrics.

Let us consider two points in 2D space:

  • Point A = $(x_1, y_1)$
  • Point B = $(x_2, y_2)$
  1. Minkowski Distance: A Generalized Metric

The Minkowski distance is a generalized metric defined as:

$$ d_p(A, B) = \left( |x_1 - x_2|^p + |y_1 - y_2|^p \right)^{1/p} $$

This formula allows you to vary the value of $p$, which changes the behavior of the distance metric. Different values of $p$ yield different types of distances, each with its own geometric and practical implications.

  2. When $p = 1$: Manhattan (Taxicab) Distance

For $p = 1$, the Minkowski formula becomes:

$$ d_1(A, B) = |x_1 - x_2| + |y_1 - y_2| $$

This is called Manhattan or Taxicab distance because it simulates travel along a grid—like navigating streets in a city. You can only move horizontally or vertically.

Example: If A = (2, 3) and B = (5, 7):

$$ d_1 = |2 - 5| + |3 - 7| = 3 + 4 = 7 $$

This distance would follow the orange path shown in the accompanying diagram, forming a right-angled route.

  3. When $p = 2$: Euclidean Distance

The most commonly used metric is when $p = 2$:

$$ d_2(A, B) = \sqrt{(x_1 - x_2)^2 + (y_1 - y_2)^2} $$

This gives the straight-line distance, like how a bird would fly directly from one point to another. The formula is simply the Pythagorean theorem.

Example: Using A = (2, 3) and B = (5, 7):

$$ d_2 = \sqrt{(2 - 5)^2 + (3 - 7)^2} = \sqrt{9 + 16} = 5 $$

  4. When $p \to \infty$: Chebyshev Distance

As $p$ approaches infinity, the Minkowski distance becomes:

$$ d_\infty(A, B) = \max\left(|x_1 - x_2|,\; |y_1 - y_2|\right) $$

This is the Chebyshev distance, often used in games like chess, where a king can move one square horizontally, vertically, or diagonally, so the number of moves it needs equals the Chebyshev distance.

Example: A = (2, 3), B = (5, 7):

$$ d_\infty = \max(3, 4) = 4 $$

It captures the largest directional change between two points.

[Diagram illustrating the different distance paths between points A and B]
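
To make these formulas concrete, here is a minimal NumPy sketch using the points A = (2, 3) and B = (5, 7) from the examples above; the helper name minkowski_distance is just for illustration.

import numpy as np

A = np.array([2, 3])
B = np.array([5, 7])

def minkowski_distance(a, b, p):
    # (|x1 - x2|^p + |y1 - y2|^p)^(1/p)
    return np.sum(np.abs(a - b) ** p) ** (1 / p)

print(minkowski_distance(A, B, p=1))   # 7.0 -> Manhattan
print(minkowski_distance(A, B, p=2))   # 5.0 -> Euclidean
print(np.max(np.abs(A - B)))           # 4   -> Chebyshev (limit as p -> infinity)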


Why Does the Value of $p$ Matter in KNN?¶

The choice of $p$ influences how distances are interpreted:

  • $p = 1$: Treats all directional changes equally. Useful when data follows grid patterns.
  • $p = 2$: Captures geometric distance. Ideal when spatial or physical distance matters.
  • $p \to \infty$: Focuses only on the largest change. Helpful in some pathfinding or board game logic.

KNN performance can vary significantly based on the distance metric. Cross-validation can help you select the best $p$ for your dataset.


Other Important Distance Metrics in KNN¶

While Minkowski metrics are common, other specialized distances are also widely used in machine learning:

  1. Mahalanobis Distance

Measures the distance between points while considering the variance and correlation between features. It is given by -

$$ D_M(x, y) = \sqrt{(x - y)^T S^{-1} (x - y)} $$

Where:

  • $x$ and $y$ are vectors (points)
  • $S$ is the covariance matrix of the dataset
  • $S^{-1}$ is its inverse

If features are correlated or have different scales, the Mahalanobis distance adjusts for that: it rescales the space so that the features become uncorrelated with equal variance, giving a truer sense of distance. It is more computationally intensive because the covariance matrix must be inverted. It is ideal when features are interrelated, and it is often used in outlier detection, multivariate analysis, and data with correlated features.
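
A minimal sketch of the formula above, using a small synthetic dataset (so the numbers are illustrative only); it computes the distance directly with NumPy and checks it against scipy.spatial.distance.mahalanobis:

import numpy as np
from scipy.spatial.distance import mahalanobis

rng = np.random.default_rng(42)
X = rng.multivariate_normal(mean=[0, 0], cov=[[3, 1], [1, 2]], size=200)

S_inv = np.linalg.inv(np.cov(X, rowvar=False))   # S^{-1}, the inverse covariance matrix
x, y = X[0], X[1]

diff = x - y
print(np.sqrt(diff @ S_inv @ diff))    # sqrt((x - y)^T S^{-1} (x - y))
print(mahalanobis(x, y, S_inv))        # same value via scipy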

  2. Cosine Similarity and Distance

Measures the angle between two vectors rather than their magnitude, so it focuses on direction only.

$$ \text{Cosine Similarity} = \frac{x \cdot y}{\|x\| \|y\|} $$

Cosine distance is simply:

$$ \text{Cosine Distance} = 1 - \text{Cosine Similarity} $$

Two vectors pointing in the same direction have cosine similarity 1, and those at 90° have similarity 0. It works well for high-dimensional sparse data such as text, but it is not well suited to purely numeric regression tasks. It is best for text mining, document clustering, and sparse high-dimensional data (e.g., TF-IDF vectors).
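
A minimal sketch of cosine similarity and distance with NumPy (the vectors here are made up purely for illustration):

import numpy as np

def cosine_distance(x, y):
    similarity = np.dot(x, y) / (np.linalg.norm(x) * np.linalg.norm(y))
    return 1 - similarity

print(cosine_distance(np.array([1, 2, 0]), np.array([2, 4, 0])))  # ~0.0 -> same direction
print(cosine_distance(np.array([1, 0, 0]), np.array([0, 1, 0])))  # 1.0  -> orthogonal (90 degrees)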

  3. Hamming Distance

Hamming distance counts the number of positions at which the corresponding symbols differ between two strings of equal length.

$$ \text{Hamming Distance} = \sum_{i=1}^n \mathbb{1}(x_i \ne y_i) $$

Where $\mathbb{1}$ is an indicator function.

It is a simple count of mismatches, which makes it ideal for binary or categorical data; it only works for discrete-valued vectors of equal length. It is fast and efficient for binary data but not suited to continuous variables. It is generally used in DNA sequence comparison, error detection in transmission (parity checks), and KNN on categorical attributes (e.g., gender, color, type).
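
A small sketch of the Hamming distance on two equal-length sequences (a made-up example):

import numpy as np

x = np.array(list("ACGTA"))
y = np.array(list("ACCTG"))

# Count the positions where the symbols differ
print(np.sum(x != y))   # 2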

  4. Jaccard Distance

Used to compare set similarity based on intersection and union.

$$ \text{Jaccard Similarity} = \frac{|A \cap B|}{|A \cup B|}, \quad \text{Jaccard Distance} = 1 - \text{Jaccard Similarity} $$

It measures how similar two sets are based on shared versus total unique elements. It applies only to sets or binary-encoded features (e.g., tag vectors) and is very effective for sparse binary data. It is usually used in recommender systems, set-based feature encoding, and tag or attribute matching.
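
A minimal sketch of Jaccard similarity and distance on two hypothetical tag sets:

A = {"action", "comedy", "thriller"}
B = {"comedy", "drama", "thriller"}

jaccard_similarity = len(A & B) / len(A | B)   # shared / total unique elements
jaccard_distance = 1 - jaccard_similarity

print(jaccard_similarity, jaccard_distance)    # 0.5 0.5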


Selecting the right distance metric is crucial in KNN. It determines which neighbors influence the model, which in turn impacts predictions. The more aligned the metric is with the nature of the data, the better the KNN algorithm will perform.


KNN as a Classifier demo¶

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

Let us use randomly generated data for this purpose. We will use make_blobs from sklearn.datasets, which generates normally distributed points around specified centers. This function returns 2 arrays -

  • First array stores the coordinates
  • Second array stores the corresponding labels
In [2]:
from sklearn.datasets import make_blobs
In [3]:
inputs, targets = make_blobs(n_samples=1000, centers=[(-6,6), (-3,2), (-6,4)] , random_state=42)

# centers defines the centers around which points are generated - here we gave 3, so the target will have 3 labels
# You can also pass an integer, e.g. centers = 5 will give you 5 different labels
# You can control the number of features with the n_features parameter
In [4]:
inputs[:2]
Out[4]:
array([[-4.97593747,  4.59252695],
       [-4.33874079,  3.54290374]])
In [5]:
targets[:2]
Out[5]:
array([2, 2])
In [6]:
inputs.shape   # 1000 rows and 2 coordinates x and y which is equivalent to 2 features
Out[6]:
(1000, 2)
In [7]:
# Let's create a pandas dataframe with the newly created data points

data = pd.DataFrame(data = inputs, columns = ['feature1', 'feature2'])
data['target'] = targets
In [8]:
data.head()
Out[8]:
feature1 feature2 target
0 -4.975937 4.592527 2
1 -4.338741 3.542904 2
2 -7.607483 6.184634 0
3 -4.923993 4.021312 2
4 -6.756351 4.577746 0
In [9]:
data['target'].value_counts()
Out[9]:
target
0    334
2    333
1    333
Name: count, dtype: int64

Visualize the dataset¶

In [10]:
plt.figure(figsize = (14,5))
sns.set()
sns.scatterplot(x = 'feature1', y = 'feature2',
                data = data,
                hue = 'target',
                palette = ['#000172', '#287281', '#986732'],
                style = 'target',
                s = 60
               )
plt.show()

To look at the normal distribution of data, we can use the jointplot from sns -

In [11]:
sns.set()
sns.jointplot(x = 'feature1', y = 'feature2',
              data = data,
              hue = 'target',
              palette = ['#000172', '#287281', '#986732'],
              height=6,
              s = 60
             )
plt.show()

So, we generated random points distributed amongst three classes. Now we will use these points to train the KNN algorithm. Before that, we need to split our data.

Splitting data into train and test¶

In [12]:
from sklearn.model_selection import train_test_split

x_train, x_test, y_train, y_test = train_test_split(data.iloc[:, :-1], 
                                                    data.iloc[:, -1], 
                                                    test_size = 0.2, 
                                                    random_state=42)
x_train.shape, x_test.shape, y_train.shape, y_test.shape
Out[12]:
((800, 2), (200, 2), (800,), (200,))
In [13]:
x_train.head(2)
Out[13]:
feature1 feature2
29 -1.469249 3.218762
535 -6.883857 6.153725

Building the model¶

In [14]:
from sklearn.neighbors import KNeighborsClassifier

# Let's instantiate the model with 1 neighbor at first
clf = KNeighborsClassifier(n_neighbors = 1)  # By default, the value of this parameter is 5
In [15]:
clf.fit(x_train, y_train)
Out[15]:
KNeighborsClassifier(n_neighbors=1)
In [16]:
samples = [[-3.6, 3], [-7.6, 1], [-2.15, 2.7]]
sample_set = pd.DataFrame(data = samples, columns=['feature1', 'feature2'])
sample_set
Out[16]:
feature1 feature2
0 -3.60 3.0
1 -7.60 1.0
2 -2.15 2.7
In [17]:
prediction = clf.predict(sample_set)
prediction
Out[17]:
array([1, 2, 1])

The predictions show that the three sample points belong to labels 1, 2, and 1 respectively. Let's retrieve the nearest neighbor of each point.

In [18]:
neighbors = clf.kneighbors(sample_set)
neighbors
Out[18]:
(array([[0.06855388],
        [0.44865184],
        [0.19497333]]),
 array([[750],
        [777],
        [509]], dtype=int64))

The result is a tuple of arrays -

  • The first array stores the Euclidean distances from the new points in the sample set to their nearest neighbors in the training set.
  • The second array stores the indices of those neighbor points in the training dataset.

Let's visualize this.

In [19]:
plt.figure(figsize = (14,5))
sns.set()
sns.scatterplot(x = x_train.iloc[:, 0], y = x_train.iloc[:, 1],
                hue = y_train,
                palette = ['#000172', '#287281', '#986732'],
                s = 60,
                legend = True
               )

sns.scatterplot(x = sample_set.iloc[:, 0], y = sample_set.iloc[:, 1],
                markers = ['o'],
                color = 'red',
                s = 30,
                legend = False
               )
    
plt.show()

The red points are the new samples plotted on top of the training data. Sometimes a new point may get assigned to a label whose points are not the closest to it. For example, a new point may be closer to class 2, but the prediction says it belongs to class 1. Why is that the case? Let's check the weights setting of the model first -

In [20]:
clf.get_params()
Out[20]:
{'algorithm': 'auto',
 'leaf_size': 30,
 'metric': 'minkowski',
 'metric_params': None,
 'n_jobs': None,
 'n_neighbors': 1,
 'p': 2,
 'weights': 'uniform'}

By default, the weights parameter in KNN is set to uniform. This means all neighbors contribute equally to the classification, regardless of how close or far they are from the point being predicted. As a result, when there is a tie between classes - for example, if one neighbor belongs to class 1 and another to class 2 - the classifier is equally likely to choose either class.

However, in practice, the classifier doesn't make a random choice in the event of a tie. It consistently picks the class with the smaller label, no matter how many times you run the classifier. Why does this happen?

To understand this, we need to look at how the predict method is implemented. Internally, it uses the mode function from the scipy.stats library to determine the most frequent class among the nearest neighbors. When there's a tie (i.e., multiple classes appear the same number of times), the mode function returns the smallest value among them.

So if both class 1 and class 2 occur once, the classifier will always return class 1, simply because it has a lower numerical label. This happens even if class 2 is represented by a neighbor that is closer to the input point than the one from class 1.

This behavior is a bit counterintuitive, especially for an algorithm like KNN, which is fundamentally based on distance. In such cases, it makes more sense to give more weight to closer neighbors.

To improve this, we can change the weights parameter from uniform to distance. When this setting is used, each neighbor's influence is determined by how close it is to the input point. Specifically, each neighbor gets a weight equal to the inverse of its distance:

$$ \text{weight}_i = \frac{1}{\text{distance}_i} $$

This means that neighbors closer to the query point have a greater impact on the prediction, while those farther away contribute less. Using distance weighting helps the model make decisions that better reflect the true structure of the data, especially in cases of ties or when neighbor distances vary significantly.
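
As a rough illustration (with made-up distances and labels, not taken from the dataset above), here is how a two-neighbor tie would be resolved once votes are weighted by the inverse of distance:

import numpy as np

# Hypothetical tie: one neighbor from class 1, one from class 2,
# but the class-2 neighbor is much closer to the query point
distances = np.array([0.9, 0.2])
labels = np.array([1, 2])

weights = 1 / distances            # weight_i = 1 / distance_i
for cls in np.unique(labels):
    print(cls, weights[labels == cls].sum())

# Class 2 gets the larger weighted vote (5.0 vs. ~1.11), so it wins,
# whereas with uniform weights the tie would fall back to the smaller label.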

In [21]:
# Let's run the model code again

clf2 = KNeighborsClassifier(n_neighbors=1, weights='distance')
clf2.fit(x_train, y_train)

prediction2 = clf2.predict(sample_set)
In [22]:
clf2.get_params()
Out[22]:
{'algorithm': 'auto',
 'leaf_size': 30,
 'metric': 'minkowski',
 'metric_params': None,
 'n_jobs': None,
 'n_neighbors': 1,
 'p': 2,
 'weights': 'distance'}
In [23]:
prediction2
Out[23]:
array([1, 2, 1])
In [24]:
prediction
Out[24]:
array([1, 2, 1])

In many situations, using uniform weights in KNN works well and is often preferred, especially when the data is evenly distributed and relatively clean. With uniform weights, every neighbor contributes equally to the classification, which simplifies the model and can prevent overfitting to local noise or outliers. However, this approach might not always capture the influence of proximity, especially in more complex or noisy datasets.

Understanding decision boundaries¶

To better understand the impact of KNN parameters - particularly the choice of k, the number of neighbors - it helps to visualize how the algorithm behaves in feature space. One effective way to do this is by constructing decision boundaries or decision regions.

Decision boundaries show the areas in the feature space where the classifier assigns different class labels. Each region corresponds to one class, and any new point that falls within a region will be classified accordingly. These boundaries shift depending on how k is set and whether uniform or distance-based weighting is used.

When k is small (such as 1 or 3), the decision boundaries are more sensitive to individual data points. This can lead to overfitting, where the model captures noise and makes overly complex boundaries. As k increases, the model becomes more stable and generalizes better, resulting in smoother and more averaged decision boundaries. However, if k is too large, the model may become too simple, potentially misclassifying points near the edge of a cluster.

By plotting decision regions for different values of k, we can observe how the model behaves and choose a value that best balances bias and variance. These visualizations help identify how robust the classifier is to variations in the data and how much influence local neighbors have on predictions.

Visual tools like decision boundary plots allow us to better understand and fine-tune the classifier for optimal performance on different datasets.

In [25]:
from mlxtend.plotting import plot_decision_regions
import time
In [26]:
plot_decision_regions(X = np.array(x_train), 
                      y = np.array(y_train),
                      X_highlight = np.array(sample_set),
                      clf = clf2, 
                      scatter_kwargs= {'s':60, 'edgecolor':'white', 'alpha':0.5},
                      legend = True)  
# This function requires 2D array - (samples, features) and labels

plt.show()
E:\7. Deep Learning\venv\lib\site-packages\sklearn\base.py:493: UserWarning: X does not have valid feature names, but KNeighborsClassifier was fitted with feature names
  warnings.warn(

The coloured sections are the decision regions, and the boundaries that separate them are the decision boundaries. This plot visually explains how KNN partitions the feature space into different class regions based on proximity to labeled training samples. The decision boundaries curve around clusters and adapt to the distribution of data points, making KNN a flexible, non-parametric classifier.

A K value of 1 is not really a good choice. The model is very flexible and creates decision boundaries that are unique to each training dataset, so adding even a single new data point can change the boundaries a lot. The model will likely overfit during training and perform poorly on new data. This kind of model has low bias and high variance.

Let's try a higher value of k and see what happens. It will take a few seconds -

In [27]:
clf3 = KNeighborsClassifier(n_neighbors=30, weights='uniform')
clf3.fit(x_train, y_train)

prediction3 = clf3.predict(sample_set)

plot_decision_regions(X = np.array(x_train), 
                      y = np.array(y_train),
                      X_highlight = np.array(sample_set),
                      clf = clf3, 
                      scatter_kwargs= {'s':60, 'edgecolor':'white', 'alpha':0.5},
                      legend = True) 
E:\7. Deep Learning\venv\lib\site-packages\sklearn\base.py:493: UserWarning: X does not have valid feature names, but KNeighborsClassifier was fitted with feature names
  warnings.warn(
Out[27]:
<Axes: >

The decision boundaries have changed quite a lot, and some green points now get misclassified. This model may suffer from underfitting, where we get low variance but high bias. So we need to find the most suitable value of K.

One way to analyze the value of k is to track the number of misclassified test data points as K increases. This metric is called the misclassification rate, which is defined as: misclassification rate = 1 - accuracy. We can also refer to it as the error rate.

Getting error rates from a set of models¶

In [28]:
from sklearn.metrics import accuracy_score

error_uniform = []  # Stores error rates from models with uniform weights
error_distance = []   # Stores error rates from models with distance-based weights

for k in range(1,31):
    model = KNeighborsClassifier(n_neighbors=k, weights='uniform')
    model.fit(x_train, y_train)
    predictions = model.predict(x_test)
    error_uniform.append(1 - accuracy_score(y_test, predictions))

    model = KNeighborsClassifier(n_neighbors=k, weights='distance')
    model.fit(x_train, y_train)
    predictions = model.predict(x_test)
    error_distance.append(1 - accuracy_score(y_test, predictions))
In [31]:
# Let's plot now

plt.plot(range(1,31), error_uniform, c = 'red', linestyle = 'solid',
         marker = 'o', markerfacecolor = 'black', label = 'Error Uniform')
plt.plot(range(1,31), error_distance, c = 'purple', linestyle = '--',
         marker = 'o', markerfacecolor = 'white', label = 'Error Distance')
plt.legend()
plt.xlabel('K values')
plt.ylabel('Error rate')
plt.show()

From the plot above, we want a value of k that is neither very small (which introduces high variance) nor very large (which introduces high bias), and that also gives a small error rate. On average, we can see that uniform weights work better here than distance-based weights. There are multiple values of k with a small error rate, so which one should we choose? We will use GridSearchCV for that.

Using GridSearchCV¶

In [32]:
from sklearn.model_selection import GridSearchCV

grid_params = {
    'n_neighbors' : range(1,31),
    'weights' : ['uniform', 'distance']
    }

gridcv = GridSearchCV(estimator = KNeighborsClassifier(),
                      param_grid=grid_params,
                      scoring='accuracy')

gridcv.fit(x_train, y_train)
Out[32]:
GridSearchCV(estimator=KNeighborsClassifier(),
             param_grid={'n_neighbors': range(1, 31),
                         'weights': ['uniform', 'distance']},
             scoring='accuracy')
In [33]:
gridcv.best_params_
Out[33]:
{'n_neighbors': 8, 'weights': 'uniform'}

GridSearchCV has returned uniform as the best weighting and 8 neighbors as optimal in our case.

In [34]:
gridcv.best_estimator_
Out[34]:
KNeighborsClassifier(n_neighbors=8)
In [35]:
gridcv.best_score_   
# This number is the mean of the accuracies obtained during cross-validation
Out[35]:
0.8625
In [36]:
clf = gridcv.best_estimator_
clf.fit(x_train, y_train)
Out[36]:
KNeighborsClassifier(n_neighbors=8)
In [37]:
predictions = clf.predict(x_test)

Evaluating Model performance¶

In [38]:
# Checking the score
accuracy_score(predictions, y_test)
Out[38]:
0.86

Accuracy alone is not always the best metric for classification tasks, especially when classes are imbalanced, so let's look at some other classification metrics -

In [39]:
from sklearn.metrics import classification_report, confusion_matrix

cnf_matrix = confusion_matrix(predictions, y_test)
cnf_matrix
Out[39]:
array([[65,  0, 15],
       [ 1, 52,  3],
       [ 8,  1, 55]], dtype=int64)
In [40]:
plt.figure(figsize=(6, 5))
sns.heatmap(
    cnf_matrix,
    annot=True,               # Show numbers in cells
    fmt='d',                  # Format numbers as integers
    cmap='magma',
    xticklabels=clf.classes_,
    yticklabels=clf.classes_
)

plt.xlabel('Predicted Label')
plt.ylabel('True Label')
plt.title('Confusion Matrix')
plt.show()
In [42]:
print(classification_report(predictions, y_test))
              precision    recall  f1-score   support

           0       0.88      0.81      0.84        80
           1       0.98      0.93      0.95        56
           2       0.75      0.86      0.80        64

    accuracy                           0.86       200
   macro avg       0.87      0.87      0.87       200
weighted avg       0.87      0.86      0.86       200

The classification report shows an overall accuracy of 86%, indicating that the model correctly classified 86% of all test instances.

  • Class 1 achieved the best performance with a precision of 0.98, recall of 0.93, and F1-score of 0.95, suggesting it is predicted with high confidence and completeness.

  • Class 0 also performed well with a precision of 0.88 and F1-score of 0.84, though its recall (0.81) is slightly lower.

  • Class 2 has the weakest metrics, particularly in precision (0.75), meaning the model often misclassifies other classes as class 2. However, it has a decent recall of 0.86.

The macro and weighted averages are balanced at around 0.87, confirming that the model maintains fairly consistent performance across classes, though there is room for improvement in class 2's precision.


KNN as a Regressor demo¶

The mechanics of this algorithm are the same as those of the KNN classifier, just applied to a regression task. The aim here is not to create an accurate model but to show how the algorithm works.

In [43]:
from sklearn.datasets import make_regression

Here we will draw random data points from a linear relationship with a single feature and a single output, which is easier to visualize.

In [49]:
inputs, targets = make_regression(n_samples = 10, n_features= 1, noise = 6,
                                 random_state = 42)

# noise deviates the data points, i.e. introduces a bit of noise into the otherwise linear data
In [50]:
plt.scatter(inputs, targets);

This is the linear dataset with some noise. The target values on the y axis vary over a wide range, so let's divide them by the maximum value.

In [51]:
targets = targets/targets.max()

plt.scatter(inputs, targets);

Great! Now we will create the model.

In [52]:
from sklearn.neighbors import KNeighborsRegressor

reg_knn = KNeighborsRegressor(n_neighbors=1)
reg_knn
Out[52]:
KNeighborsRegressor(n_neighbors=1)
In [53]:
reg_knn.fit(inputs, targets)
Out[53]:
KNeighborsRegressor(n_neighbors=1)
In [70]:
x_pred = 0.53
y_pred = reg_knn.predict([[x_pred]])
y_pred
Out[70]:
array([-0.08901495])
In [71]:
neighbors_reg = reg_knn.kneighbors([[x_pred]])
neighbors_reg
Out[71]:
(array([[0.01256004]]), array([[5]], dtype=int64))

This returns the same kind of tuple as in classification; the only difference is that the distance in the first array is measured along the single feature (the x axis). Let's plot to see -

In [72]:
plt.scatter(inputs, targets)
plt.scatter(x_pred, y_pred);

As shown above, the nearest neighbor is at index 5. Let's check the target value at index 5 and compare it with our predicted value -

In [75]:
y_pred, targets[5]  # They are almost the same
Out[75]:
(array([-0.08901495]), -0.08901494592896088)

In KNN regression, when k = 1, the predicted value of the target variable $\hat{y}$ is simply the target value of the nearest neighbor. However, when the value of k is increased to a number greater than 1, the prediction is no longer based on a single point but instead on the average of the target values of the k nearest neighbors.

For example, if k = 3, the algorithm identifies the 3 closest data points to the query instance, retrieves their corresponding target values, and computes their average. This average becomes the predicted output for the query point.

General Formula for KNN Regression:

Let the k nearest neighbors to a point $x$ be $x_1, x_2, \dots, x_k$, with corresponding target values $y_1, y_2, \dots, y_k$. Then, the predicted value $\hat{y}$ is given by:

$$ \hat{y} = \frac{1}{k} \sum_{i=1}^{k} y_i $$

This approach allows the prediction to be more stable and less sensitive to noise, especially when compared to using only the single nearest neighbor. If we use distance-based weighting, the prediction formula adjusts to give closer neighbors more influence.
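
For reference, a distance-weighted version of the prediction (assuming inverse-distance weights, as used by weights='distance') would be:

$$ \hat{y} = \frac{\sum_{i=1}^{k} w_i \, y_i}{\sum_{i=1}^{k} w_i}, \qquad w_i = \frac{1}{d_i} $$

where $d_i$ is the distance of the $i$-th neighbor from the query point.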

In [82]:
# Let's change k to 4 and see what we get

reg_knn = KNeighborsRegressor(n_neighbors=4)
reg_knn.fit(inputs, targets)

x_pred = 0.53
y_pred = reg_knn.predict([[x_pred]])

plt.scatter(inputs, targets)
plt.scatter(x_pred, y_pred);
In [86]:
neighbors = reg_knn.kneighbors([[x_pred]])
neighbors
Out[86]:
(array([[0.01256004, 0.03328585, 0.11768854, 0.23743473]]),
 array([[5, 6, 9, 2]], dtype=int64))
In [92]:
(targets[5] + targets[6] + targets[9] + targets[2])/4
Out[92]:
0.06162155187861659
In [90]:
y_pred
Out[90]:
array([0.06162155])

Exactly the same, just as the formula says.

Now let's compare the parametric and non-parametric approaches.


Comparison of KNN Regressor with Linear Regression¶

Parametric approaches refer to algorithms that make strong assumptions about the form or structure of the data. A common example is linear regression, which assumes that the relationship between the independent and dependent variables is linear. In such a model, increasing the input by one unit results in a fixed, proportional change in the output. While this makes the model simple, interpretable, and computationally efficient, it is also quite restrictive and may not work well when the true relationship is more complex or non-linear.

On the other hand, non-parametric approaches like KNN make no assumptions about the underlying data distribution. KNN adapts to the shape and structure of the data by using the target values of nearby points to make predictions. This flexibility makes it a good choice when the form of the relationship between variables is not known in advance or is highly irregular.

Given this, one might wonder why linear regression is still widely used. The answer lies in the trade-off between simplicity and flexibility. Linear regression tends to perform well when the true relationship is approximately linear or when interpretability is a priority. It also requires less data to train effectively and can extrapolate to unseen regions of the feature space. KNN, while more flexible, may require a large amount of data, can be sensitive to noise, and struggles with extrapolation. In the end, the choice depends on the nature of the dataset and the specific goals of the analysis.

Let's see here how it works -

Let's define data first.

In [96]:
inputs, targets = make_regression(n_samples = 500,
                                  n_features= 1,
                                  noise = 28,
                                  random_state=42)

targets = targets/targets.max()

plt.scatter(inputs, targets, color = '#934421')
plt.xlabel('Features')
plt.ylabel('Targets');
In [130]:
# Splitting the dataset

x_train, x_test, y_train, y_test = train_test_split(inputs, targets,
                                                    test_size=0.2, random_state=42)
In [131]:
fig = plt.figure(figsize=(14, 4))

ax1 = fig.add_subplot(1, 2, 1)
ax1.scatter(x_train, y_train, color='#934421')
ax1.set_title('Training Data')
ax1.set_xlabel('Features')
ax1.set_ylabel('Targets')

ax2 = fig.add_subplot(1, 2, 2)
ax2.scatter(x_test, y_test, color='#934421')
ax2.set_title('Test Data')
ax2.set_xlabel('Features')
ax2.set_ylabel('Targets')

plt.show()

Now, let's perform linear and KNN regression

In [132]:
from sklearn.linear_model import LinearRegression
from sklearn.neighbors import KNeighborsRegressor

grid_knn = GridSearchCV(estimator=KNeighborsRegressor(),
                       param_grid= {
                           'n_neighbors' : range(1,31),
                           'weights' : ['distance', 'uniform']
                       },
                       scoring='neg_mean_squared_error')

grid_knn.fit(x_train, y_train)
Out[132]:
GridSearchCV(estimator=KNeighborsRegressor(),
             param_grid={'n_neighbors': range(1, 31),
                         'weights': ['distance', 'uniform']},
             scoring='neg_mean_squared_error')
In [133]:
grid_knn.best_estimator_, grid_knn.best_score_
Out[133]:
(KNeighborsRegressor(n_neighbors=15), -0.013154379819456791)

The best score is the negative mean squared error, so on average our model makes a squared error of about 0.013 between predicted and actual target values.

In [134]:
# Let's fit KNN Regressor model with this best estimator and initiate Linear Regression

reg_linear = LinearRegression()
reg_linear.fit(x_train, y_train)
linear_prediction = reg_linear.predict(x_test)

reg_knn = grid_knn.best_estimator_
reg_knn.fit(x_train, y_train)
knn_prediction = reg_knn.predict(x_test)
In [135]:
fig = plt.figure(figsize=(14, 4))

ax1 = fig.add_subplot(1, 2, 1)
ax1.scatter(x_test, y_test, color='#934421')
ax1.plot(x_test, linear_prediction)
ax1.set_title('Fit with Linear Regression')
ax1.set_xlabel('Features')
ax1.set_ylabel('Targets')

ax2 = fig.add_subplot(1, 2, 2)
ax2.scatter(x_test, y_test, color='#934421')
ax2.plot(x_test, knn_prediction)
ax2.set_title('Fit with KNN Regressor')
ax2.set_xlabel('Features')
ax2.set_ylabel('Targets')

plt.show()

For KNN, we see a jagged or uneven line instead of a smooth straight line because:

The KNN regressor is non-parametric and non-linear. It doesn't learn a global equation (like linear regression does). Instead, it:

  • Predicts the target for each test point based on the local average of its k nearest neighbors
  • This causes the prediction line to zigzag or appear step-like, especially when k is small or the test points are not sorted before plotting

Let's now see how it looks with sorted values, and we will also try 3 different k values.

In [138]:
y_pred_knn = []
for i in [1,10,40]:
    model = KNeighborsRegressor(n_neighbors=i)
    model.fit(x_train, y_train)
    y_pred_knn.append(model.predict(x_test))
In [140]:
df = pd.DataFrame(data = {
                        'x_test' : list(x_test.flatten()),
                        'y_test' : list(y_test.flatten()),
                        'y_pred_linear' : list(linear_prediction.flatten()),
                        'y_pred_knn_cv' : list(knn_prediction.flatten()),
                        'y_pred_knn_1' : list(y_pred_knn[0].flatten()),
                        'y_pred_knn_10' : list(y_pred_knn[1].flatten()),
                        'y_pred_knn_40' : list(y_pred_knn[2].flatten()),
                    }
                 )

df = df.sort_values(by = ['x_test'])
x_test_sorted = df['x_test'].to_list()
y_test_sorted = df['y_test'].to_list()
y_pred_linear_sorted = df['y_pred_linear'].to_list()
y_pred_knn_cv_sorted = df['y_pred_knn_cv'].to_list()
y_pred_knn_1_sorted = df['y_pred_knn_1'].to_list()
y_pred_knn_10_sorted = df['y_pred_knn_10'].to_list()
y_pred_knn_40_sorted = df['y_pred_knn_40'].to_list()
In [143]:
fig = plt.figure(figsize=(14, 4))

ax1 = fig.add_subplot(1, 2, 1)
ax1.scatter(x_test_sorted, y_test_sorted, color='#934421')
ax1.plot(x_test_sorted, y_pred_linear_sorted)
ax1.set_title('Fit with Linear Regression')
ax1.set_xlabel('Features')
ax1.set_ylabel('Targets');
In [151]:
fig = plt.figure(figsize=(21, 6))  

ax1 = fig.add_subplot(1, 3, 1)
ax1.scatter(x_test_sorted, y_test_sorted, color='#934421')
ax1.plot(x_test_sorted, y_pred_knn_1_sorted, color='blue')
ax1.set_title('KNN Regression (k=1)')
ax1.set_xlabel('Features')
ax1.set_ylabel('Targets')

ax2 = fig.add_subplot(1, 3, 2)
ax2.scatter(x_test_sorted, y_test_sorted, color='#934421')
ax2.plot(x_test_sorted, y_pred_knn_10_sorted, color='blue')
ax2.set_title('KNN Regression (k=10)')
ax2.set_xlabel('Features')
ax2.set_ylabel('Targets')

ax3 = fig.add_subplot(1, 3, 3)
ax3.scatter(x_test_sorted, y_test_sorted, color='#934421')
ax3.plot(x_test_sorted, y_pred_knn_40_sorted, color='blue')
ax3.set_title('KNN Regression (k=40)')
ax3.set_xlabel('Features')
ax3.set_ylabel('Targets')

plt.tight_layout()
plt.show()
In [149]:
fig = plt.figure(figsize=(14, 4))

ax1 = fig.add_subplot(1, 2, 1)
ax1.scatter(x_test_sorted, y_test_sorted, color='#934421')
ax1.plot(x_test_sorted, y_pred_knn_cv_sorted)
ax1.set_title('Fit with KNN Regression')
ax1.set_xlabel('Features')
ax1.set_ylabel('Targets');

This graph shows the best fit with our data. Let's now calculate the error.

In [152]:
from sklearn.metrics import mean_squared_error

linear_reg_error = mean_squared_error(y_test, linear_prediction)
knn_reg_error = mean_squared_error(y_test, knn_prediction)
In [153]:
linear_reg_error
Out[153]:
0.010253765593013877
In [154]:
knn_reg_error
Out[154]:
0.010670577903965932

Error is almost the same for our data. For datasets that exhibit a clear linear relationship between features and target values, both linear regression and KNN regression can provide similar levels of accuracy. However, in such cases, linear regression is often a better choice. This is because linear regression is a parametric model that assumes a specific form for the relationship between variables, allowing it to capture the underlying trend efficiently with fewer data points. In contrast, KNN regression is non-parametric and relies on local patterns in the data. It may not effectively capture the overall trend, especially when predicting values outside the range of the training data. KNN also requires a larger dataset to perform well and struggles with extrapolation, where linear regression can still produce reasonable predictions based on the learned coefficients. Therefore, when the true relationship is known to be linear, linear regression often provides more reliable and interpretable results.


Cases when KNN Regressor can work better than Linear Regression¶

Here, we will write a non_linear_regression function that generates a synthetic non-linear regression dataset. It creates input features x and corresponding target values y based on a non-linear relationship that includes a quadratic and a sinusoidal component, plus optional Gaussian noise.

  • uni = lambda n : np.random.uniform(-2, 2, n) - Generates n uniformly distributed random numbers between -2 and 2.
  • add_noise = lambda n : np.random.normal(0, 1, n) - Generates n values from a standard normal distribution (mean=0, std=1) to be used as noise.
  • y = y_raw + noise * np.std(y_raw) * add_noise(n_samples) - Adds Gaussian noise scaled by:
    • noise factor
    • Standard deviation of y_raw, so that the noise is relative to the signal's variation.
In [157]:
from math import sin

# Create a function that generates a random non-linear dataset
def non_linear_regression(n_samples, noise = 0, random_state = None):
    
    if random_state:
        np.random.seed(random_state)

    uni = lambda n : np.random.uniform(-2, 2, n)
    add_noise =  lambda  n : np.random.normal(0, 1, n)
    
    x = uni(n_samples)
    x.sort()
    
    y_raw = [i**2 + sin(5*i) for i in x]
    y = y_raw + noise * np.std(y_raw) * add_noise(n_samples)
        
    return x, y
In [161]:
# Generate data without noise
inputs_no_noise, target_no_noise = non_linear_regression(300, 0, 42)

# Using the same random state as above, generate the data with some noise
inputs, target = non_linear_regression(300, 0.5, 42)
In [162]:
sns.set()

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(13,4))

ax1.scatter(inputs_no_noise, target_no_noise, color = '#000C1F')
ax1.set_title('Data without noise')
ax1.set_xlabel('Feature')
ax1.set_ylabel('Target')

ax2.scatter(inputs, target, color = '#000C1F')
ax2.set_title('Data with noise')
ax2.set_xlabel('Feature')
ax2.set_ylabel('Target');

Noise is introduced to make it a bit complicated.

In [163]:
x_train, x_test, y_train, y_test = train_test_split(inputs, 
                                                    target, 
                                                    test_size = 0.2, 
                                                    random_state = 42)
In [165]:
sns.set()

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(13,4))

ax1.scatter(x_train, y_train, color = '#000C1F')
ax1.set_title('Training data')
ax1.set_xlabel('Feature')
ax1.set_ylabel('Target')

ax2.scatter(x_test, y_test, color = '#000C1F')
ax2.set_title('Test data')
ax2.set_xlabel('Feature')
ax2.set_ylabel('Target');

Now let's fit linear regression and multiple KNN regression

In [166]:
reg_lin = LinearRegression()


# In sklearn, when fitting data with only 1 feature, the following reshaping should be applied.
reg_lin.fit(x_train.reshape(-1, 1), y_train)
y_pred_lin = reg_lin.predict(x_test.reshape(-1, 1))
In [167]:
k = 81
mse_lin = []

# Calculate the MSE value for the linear regression
mse_lin = mean_squared_error(y_test, y_pred_lin)

# The MSE value calculated above is the same for all values of K. 
# Therefore, we create an array storing that MSE value (k-1) many times.
# This will later be used to plot the MSE value versus the number of nearest neighbors.
mse_lin = [mse_lin]*(k-1)


mse_knn = []
for i in range(1, k):
    reg_knn = KNeighborsRegressor(n_neighbors = i)
    reg_knn.fit(x_train.reshape(-1, 1), y_train)
    y_pred_knn = reg_knn.predict(x_test.reshape(-1, 1))
    mse_knn.append(mean_squared_error(y_test, y_pred_knn))

Now let's plot MSE vs Number of Neighbors

In [168]:
sns.set()

fig, ax = plt.subplots()

# Since the linear regression is not affected by the value of K, the output is a straight line.
plt.plot(list(range(1, k)), 
         mse_lin, 
         color = 'orange', 
         label = 'linear')

# Plot the MSE of the KNN regressions versus the value of K.
plt.plot(list(range(1, k)), 
         mse_knn, 
         color = 'red', 
         marker = 'o', 
         markerfacecolor = '#000C1F',
         label = 'KNN')

ax.legend(loc='lower right')
ax.set_title('Mean-Squared Error (MSE)')
ax.set_xlabel('K')
ax.set_ylabel('MSE')
plt.ylim(0);

KNN gives a much better result because there is a non-linear relationship in the data. We could guess that a linear model would not be a good fit here, and that is indeed the case.

In [169]:
# Create a list to store the predictions from 3 KNN regressions
y_pred_knn = []

# Create 3 KNN regressions with K = 1, 7, and 80.
for i in [1, 7, 80]:
    reg_knn = KNeighborsRegressor(n_neighbors = i)
    reg_knn.fit(x_train.reshape(-1, 1), y_train)
    y_pred_knn.append(reg_knn.predict(x_test.reshape(-1, 1)))
In [170]:
df = pd.DataFrame(data = {'x_test':list(x_test.flatten()), 
                          'y_test':list(y_test.flatten()), 
                          'y_pred_lin':list(y_pred_lin.flatten()), 
                          'y_pred_knn-1':list(y_pred_knn[0].flatten()), 
                          'y_pred_knn-7':list(y_pred_knn[1].flatten()), 
                          'y_pred_knn-80':list(y_pred_knn[2].flatten())})


df = df.sort_values(by = ['x_test'])

x_test_sorted = df['x_test'].tolist()
y_test_sorted = df['y_test'].tolist()
y_pred_lin_sorted = df['y_pred_lin'].tolist()
y_pred_knn1_sorted = df['y_pred_knn-1'].tolist()
y_pred_knn7_sorted = df['y_pred_knn-7'].tolist()
y_pred_knn80_sorted = df['y_pred_knn-80'].tolist()

Plotting regression on top of test data

In [171]:
sns.set()

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(10,4))

ax1.scatter(x_test_sorted, 
            y_test_sorted, 
            color = '#000C1F')

ax1.plot(x_test_sorted, 
         y_pred_lin_sorted, 
         color = 'orange')

ax1.set_title('Linear fit on top of the test data')
ax1.set_xlabel('Feature')
ax1.set_ylabel('Target')

ax2.scatter(x_test_sorted, 
            y_test_sorted, 
            color = '#000C1F')

ax2.plot(x_test_sorted, 
         y_pred_knn7_sorted, 
         color = 'red', 
         marker = 'o', 
         markerfacecolor = 'yellow')

ax2.set_title('KNN fit on top of the test data (K = 7)')
ax2.set_xlabel('Feature')
ax2.set_ylabel('Target');

Plotting regression on top of noiseless data

In [172]:
fig, (ax1,ax2, ax3) = plt.subplots(1,3, figsize=(16, 5))

# Plot the noiseless data on all 3 figures
ax1.scatter(inputs_no_noise, target_no_noise, color = '#000C1F')
ax2.scatter(inputs_no_noise, target_no_noise, color = '#000C1F')
ax3.scatter(inputs_no_noise, target_no_noise, color = '#000C1F')

# Plot the fit from a KNN regression (K = 1)
ax1.plot(x_test_sorted, 
         y_pred_knn1_sorted, 
         color = 'red',
         marker = 'o', 
         markerfacecolor = 'yellow')
ax1.set_title('K = 1')
ax1.set_xlabel('Feature')
ax1.set_ylabel('Target')

# Plot the fit from a KNN regression (K = 7)
ax2.plot(x_test_sorted, 
         y_pred_knn7_sorted, 
         color = 'red',
         marker = 'o', 
         markerfacecolor = 'yellow')
ax2.set_title('K = 7')
ax2.set_xlabel('Feature')
ax2.set_ylabel('Target')

# Plot the fit from a KNN regression (K = 80)
ax3.plot(x_test_sorted, 
         y_pred_knn80_sorted, 
         color = 'red',
         marker = 'o', 
         markerfacecolor = 'yellow')
ax3.set_title('K = 80')
ax3.set_xlabel('Feature')
ax3.set_ylabel('Target');

Thus, KNN is the better choice in scenarios where no linear relationship is observed.


Deciding on using Distance Metric¶

Let's revisit the Role of the p Parameter -

The distance metric used in KNN plays a critical role in how neighbors are selected. The general formula for distance is defined by the Minkowski metric, which can be written as:

$$ \left( |x_1 - x_2|^p + |y_1 - y_2|^p \right)^{1/p} $$

By varying the value of p, we get different types of distances:

  • When p = 1, the formula becomes the Manhattan (or taxicab) distance.
  • When p = 2, it becomes the familiar Euclidean distance.
  • Higher values of p result in other forms of the Minkowski distance, and as p → ∞, it approaches the Chebyshev distance (which only considers the largest coordinate difference).

While Euclidean distance (p = 2) is common, it is not always the best option for all datasets. Depending on the feature distribution, scale, or clustering of data, other values of p might offer better classification performance.

Instead of guessing which distance is optimal, we can automate this choice.

Using GridSearchCV to select the best p¶

The process involves:

  1. Setting up a parameter grid that includes multiple values for p (e.g., from 1 to 5 using range(1,6)).
  2. Creating an instance of GridSearchCV with:
    • The KNeighborsClassifier as the model (estimator).
    • The defined parameter grid.
    • A scoring method such as accuracy.
  3. Training multiple models, each with a different p value, using cross-validation.
  4. Choosing the best-performing model automatically by checking which parameter configuration gave the highest cross-validation accuracy.

So, instead of assuming a fixed distance metric, it's better to tune p as a hyperparameter. GridSearchCV makes this easy by systematically evaluating performance across a range of values. Using a higher-order Minkowski distance might capture subtle relationships in the data that simpler metrics miss. This approach ensures that the distance function is tailored to the data, potentially leading to more accurate and robust predictions. A sketch of such a search is shown below.
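
A hedged sketch of this search, reusing the x_train and y_train from the classifier demo above (the exact grid values are only an example):

from sklearn.model_selection import GridSearchCV
from sklearn.neighbors import KNeighborsClassifier

grid_p = GridSearchCV(estimator=KNeighborsClassifier(),
                      param_grid={'p': range(1, 6),              # Minkowski orders to try
                                  'n_neighbors': range(1, 31),
                                  'weights': ['uniform', 'distance']},
                      scoring='accuracy')

grid_p.fit(x_train, y_train)
print(grid_p.best_params_, grid_p.best_score_)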


KNN Pros and Cons¶

KNN Classifier¶

Pros:

  • Simple and easy to understand.
  • No training phase; makes predictions directly using the training data.
  • Naturally handles multi-class classification.
  • Effective when decision boundaries are irregular.
  • Flexible to feature types with appropriate distance metrics (e.g., Hamming for categorical).

Cons:

  • Computationally expensive at prediction time (especially with large datasets).
  • Sensitive to the choice of distance metric and the value of k.
  • Poor performance on imbalanced datasets.
  • Affected by noisy data and irrelevant features.
  • Requires proper feature scaling (e.g., normalization or standardization).

KNN Regressor¶

Pros:

  • Makes no assumption about the underlying data distribution.
  • Can model complex, non-linear relationships.
  • Easy to implement and intuitive.
  • Adapts well to local data patterns.
  • Performs well when the target function is smooth.

Cons:

  • Struggles with extrapolation outside the training data range.
  • Sensitive to outliers in target values.
  • Requires large datasets to work effectively.
  • Slower predictions, because there is no training phase and the full dataset must be scanned at prediction time.
  • Choice of k and feature scaling strongly impact performance.

KNN Classifier and Regressor – Drawbacks¶

  1. Computational cost during prediction: Since KNN stores the entire training dataset and performs calculations for each prediction, it can be slow and inefficient, especially with large datasets.

  2. Curse of dimensionality: As the number of features increases, the distance between data points becomes less meaningful. This reduces the effectiveness of the algorithm and may lead to poor performance in high-dimensional spaces.

  3. Limited suitability for categorical data: KNN struggles with purely categorical features unless special distance metrics are applied. Standard Euclidean distance does not work well for non-numeric data.

  4. Highly sensitive to irrelevant or noisy features: If the dataset contains unimportant or noisy features, they can distort distance calculations and reduce prediction accuracy. Proper feature selection or scaling is essential.

  5. Memory intensive: Because KNN stores the entire dataset, it can consume a lot of memory, especially for large training sets.

  6. No model interpretation: KNN does not provide an explicit model or formula, so it lacks interpretability compared to parametric methods like linear regression.

  7. Poor at extrapolation: In regression tasks, KNN cannot predict values outside the range of the training data, unlike linear regression which can extend the fitted line.