Lighthouse Labs W9D4 - Applications of Machine Learning
Instructor: Socorro E. Dominguez-Vidana
Overview¶
- [ ] Introduction to Machine Learning Applications
- [ ] Why Feature Engineering Matters
- [ ] Applications in Different Domains
- [ ] Key ML Techniques for Each Domain
- [ ] Evaluation Metrics
Introduction to Machine Learning Applications¶
There are a ton of machine learning applications -- too many to discuss in just one lecture...

Machine Learning is transforming industries by providing data-driven insights and automation. The applications of ML can be broadly classified into supervised, unsupervised, and reinforcement learning tasks.
Choosing the right algorithm¶
One of the biggest challenges when tackling any machine learning problem is choosing the right algorithm. At this stage of your career this will probably feel daunting and difficult, but with more experience, you will realize that the problem itself will guide you toward the most effective tools and methods.

Why Feature Engineering Matters¶
A Seattle coffee company has changed how lattes and espressos are made. Artly, a 2-year-old startup, just raised $8.3 million to fuel the growth of its robotic baristas.
Artly has developed an AI-powered machine that it claims makes a "perfect cup of coffee every time," using computer vision algorithms to guide a robotic arm and monitor drink quality.
Today we are going to develop BrewMaster3000X.

BrewMaster3000X will take a different approach: we will use the fact that we can define the position of the arm's tip with the following forward kinematics equations:
$x = a_2 \cos{\theta_1} \cos{\theta_2} + a_3 \cos{\theta_1} \cos{(\theta_2 + \theta_3)}$
This equation determines the horizontal position of the tip along the x-axis, influenced by both the joint angles ($\theta_1$, $\theta_2$, $\theta_3$) and the arm segment lengths ($a_2$ and $a_3$).
$y = a_2 \sin{\theta_1} \cos{\theta_2} + a_3 \sin{\theta_1} \cos{(\theta_2 + \theta_3)}$
This equation provides the horizontal position along the y-axis. Together with the x-equation, it fully specifies the tip's horizontal position, incorporating the robot's rotation about the base ($\theta_1$).
$z = a_2 \sin{\theta_2} + a_3 \sin{(\theta_2 + \theta_3)}$
This equation defines the vertical position, capturing the height of the tip above the workspace as influenced by the second and third joints.
- The inputs are the joint angles $\theta_1$, $\theta_2$, and $\theta_3$,
- The outputs are the tip position $(x,y,z)$.
The equations work together to map the arm’s complex movements into a clear, predictable path in space.
When BrewMaster3000X reaches out to pour coffee or create latte art, these equations ensure that its tip moves precisely where it needs to be, avoiding errors and delivering a flawless brew every time. Predicting the tip's position is the key to turning a simple robotic arm into an artist of the coffee world.
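To make this mapping concrete, here is a minimal sketch of the forward kinematics as a plain Python function (the function name and default lengths are illustrative, chosen to match the toy values used below):
import numpy as np

def tip_position(theta1, theta2, theta3, a2=0.54, a3=0.36):
    # Forward kinematics: joint angles (radians) -> tip position (x, y, z)
    x = a2*np.cos(theta1)*np.cos(theta2) + a3*np.cos(theta1)*np.cos(theta2 + theta3)
    y = a2*np.sin(theta1)*np.cos(theta2) + a3*np.sin(theta1)*np.cos(theta2 + theta3)
    z = a2*np.sin(theta2) + a3*np.sin(theta2 + theta3)
    return x, y, z

tip_position(0.0, np.pi/2, 0.0)   # arm pointing straight up: x and y are ~0, z = a2 + a3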
Challenges for our robot arm:¶
As a barista, BrewMaster3000X needs to perform tasks requiring pinpoint accuracy, such as:
- Pouring coffee into a cup without spilling.
- Creating latte art by moving the tip of the steam wand precisely.
- Picking up and placing cups or saucers in tight spaces.
- Operating in a crowded workspace, where predicting its movements ensures it won’t knock over other items.
For this, let's try to build a simple neural network (multi-layer perceptron) regressor to model the relationship between joint angles and tip position.
First, we'll set up the data based on the physical equations -- imagine we actually recorded these measurements from an experiment.
import numpy as np
from sklearn.neural_network import MLPRegressor
from sklearn.metrics import mean_absolute_error
### Toy data
a2 = 0.54   # length of the first arm segment
a3 = 0.36   # length of the second arm segment
N = 100
# Random joint angles in [0, 2*pi)
q1 = 2*np.pi*np.random.rand(N)
q2 = 2*np.pi*np.random.rand(N)
q3 = 2*np.pi*np.random.rand(N)
# Tip position from the forward kinematics equations above
x_end = a2*np.cos(q1)*np.cos(q2) + a3*np.cos(q1)*np.cos(q2+q3)
y_end = a2*np.sin(q1)*np.cos(q2) + a3*np.sin(q1)*np.cos(q2+q3)
z_end = a2*np.sin(q2) + a3*np.sin(q2+q3)
X = np.concatenate([q1.reshape(-1,1), q2.reshape(-1,1), q3.reshape(-1,1)], axis=1)
y = np.concatenate([x_end.reshape(-1,1), y_end.reshape(-1,1), z_end.reshape(-1,1)], axis=1)
X[0]
array([4.37883903, 0.34684846, 0.29600127])
Next, let's set up and train the neural network.
mlp_basic = MLPRegressor(hidden_layer_sizes=(100,))
mlp_basic.fit(X,y)
MLPRegressor()
Now we can predict the outputs and evaluate the error.
y_pred = mlp_basic.predict(X)
mean_absolute_error(y,y_pred)
np.float64(0.22263402192300832)
What if, instead of simply using the joint angles as inputs, we acknowledged the role of trigonometry in the conversion between joint angles and positional coordinates? By doing so, we can engineer additional features to improve our model's representation of the system.
Instead of only feeding the 3 joint angles ($\theta_1$, $\theta_2$, $\theta_3$) as inputs, we can compute their sine and cosine values and use these as inputs. Our new input set would then be:
($\cos{\theta_1}$, $\sin{\theta_1}$, $\cos{\theta_2}$, $\sin{\theta_2}$, $\cos{\theta_3}$, $\sin{\theta_3}$)
X = np.concatenate([q1.reshape(-1,1), q2.reshape(-1,1), q3.reshape(-1,1)],axis=1)
X_feng = np.concatenate([np.cos(X), np.sin(X)],axis=1)
X_feng[0]
array([-0.32739938, 0.9404487 , 0.95651055, -0.94488605, 0.33993564, 0.29169773])
mlp_feng = MLPRegressor(hidden_layer_sizes=(100,))
mlp_feng.fit(X_feng,y)
MLPRegressor()
y_pred_feng = mlp_feng.predict(X_feng)
mean_absolute_error(y,y_pred_feng)
np.float64(0.08900489232278345)
Recognize these trigonometric identities:
$\cos(\theta_1 + \theta_2) = \cos\theta_1\cos\theta_2 - \sin\theta_1\sin\theta_2$
$\sin(\theta_1 + \theta_2) = \sin\theta_1\cos\theta_2 + \cos\theta_1\sin\theta_2$
Since the kinematic equations contain terms like $\cos(\theta_2 + \theta_3)$, sums of angles are natural candidates for additional features:
q1r = q1.reshape(-1,1)
q2r = q2.reshape(-1,1)
q3r = q3.reshape(-1,1)
X = np.concatenate([q1r, q2r, q3r, q1r+q2r, q1r+q3r, q2r+q3r, q1r+q2r+q3r],axis=1)
X_feng = np.concatenate([np.cos(X), np.sin(X)],axis=1)
mlp_feng = MLPRegressor(hidden_layer_sizes=(100,))
mlp_feng.fit(X_feng,y)
MLPRegressor()
y_pred_feng = mlp_feng.predict(X_feng)
mean_absolute_error(y,y_pred_feng)
np.float64(0.05849829170830978)
We can go even further and include angle differences as well:
q1r = q1.reshape(-1,1)
q2r = q2.reshape(-1,1)
q3r = q3.reshape(-1,1)
X = np.concatenate([q1r, q2r, q3r, q1r+q2r, q1r+q3r, q2r+q3r, q1r+q2r+q3r, q1r-q2r, q1r-q3r, q2r-q3r, q1r-q2r+q3r, q1r+q2r-q3r, q1r-q2r-q3r],axis=1)
X_feng = np.concatenate([np.cos(X), np.sin(X)],axis=1)
mlp_feng = MLPRegressor(hidden_layer_sizes=(100,))
mlp_feng.fit(X_feng,y)
z_feng = mlp_feng.predict(X_feng)
mean_absolute_error(y,z_feng)
np.float64(0.04462438862429715)
For comparison, here is the MAE of a trivial baseline for the x-coordinate that always predicts the mean value (the +1 shift does not change the MAE):
mean_absolute_error(x_end + 1,np.ones_like(x_end)*np.mean(x_end+1))
np.float64(0.2360743314075817)
We observe a lower error now. Forward kinematics involves determining the position of the robotic arm's tip (end effector) based on the angles of its joints and the lengths of its links. The equations for the position in 3D space are inherently trigonometric. By thoughtfully designing our inputs, we've relieved the neural network from the burden of learning the underlying trigonometric relationships, and the model can focus on solving the problem more efficiently.
Takeaway: Prepare your data in a way that makes it easier for the model to learn.
Takeaway II: Some of these ideas will only come from interdisciplinary teams and working with folks who have domain expertise, but it will also be your responsibility to study and read papers related to the work that you are doing.
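One caveat before moving on: all of the errors above were computed on the same data the models were trained on. A minimal sketch of a more honest evaluation on a held-out split (reusing X_feng and y from above; max_iter and random_state are illustrative choices, not tuned values):
from sklearn.model_selection import train_test_split
X_tr, X_te, y_tr, y_te = train_test_split(X_feng, y, test_size=0.2, random_state=42)
mlp_holdout = MLPRegressor(hidden_layer_sizes=(100,), max_iter=2000, random_state=42)
mlp_holdout.fit(X_tr, y_tr)
mean_absolute_error(y_te, mlp_holdout.predict(X_te))   # MAE on angles the model never saw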
Evaluation Metrics¶
The Story: Dr. Patel's Clinic¶
Dr. Patel runs a busy cardiology clinic. Every day, she evaluates dozens of patients with varying risk factors for heart disease, such as age, blood pressure, cholesterol levels, and more. While Dr. Patel is experienced, she’s aware that even the best doctors can miss subtle patterns in the data. To ensure her patients receive the best care, she decides to use a machine learning model to help predict which patients are at high risk of developing heart disease.
The stakes are high:
- False negatives (missed cases) could lead to untreated heart disease and potentially fatal outcomes.
- False positives (incorrectly flagged cases) might lead to unnecessary stress for patients and expensive tests.
Dr. Patel must choose the right evaluation metric to trust her model and make informed decisions.
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score
data = pd.read_csv('data/heart_disease.csv')
#data['target'] = data['target'].apply(lambda x: 0 if x == 0 else 1)
data.head()
| | age | sex | cp | trestbps | chol | fbs | restecg | thalach | exang | oldpeak | slope | ca | thal | target |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | 63.0 | 1.0 | 1.0 | 145.0 | 233.0 | 1.0 | 2.0 | 150.0 | 0.0 | 2.3 | 3.0 | 0.0 | 6.0 | 0 |
| 1 | 67.0 | 1.0 | 4.0 | 160.0 | 286.0 | 0.0 | 2.0 | 108.0 | 1.0 | 1.5 | 2.0 | 3.0 | 3.0 | 2 |
| 2 | 67.0 | 1.0 | 4.0 | 120.0 | 229.0 | 0.0 | 2.0 | 129.0 | 1.0 | 2.6 | 2.0 | 2.0 | 7.0 | 1 |
| 3 | 37.0 | 1.0 | 3.0 | 130.0 | 250.0 | 0.0 | 0.0 | 187.0 | 0.0 | 3.5 | 3.0 | 0.0 | 3.0 | 0 |
| 4 | 41.0 | 0.0 | 2.0 | 130.0 | 204.0 | 0.0 | 2.0 | 172.0 | 0.0 | 1.4 | 1.0 | 0.0 | 3.0 | 0 |
X = data.drop('target', axis=1)
y = data['target']
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = RandomForestClassifier()
model.fit(X_train, y_train)
RandomForestClassifier()
y_pred = model.predict(X_test)
model.score(X_test, y_test)
0.5081967213114754
What does that even mean?¶
When working with sklearn, the default metric for classifiers is accuracy. Accuracy is easy to understand and interpret, and it works well in cases where all classes are equally important. Accuracy has historically been the go-to metric in machine learning tasks, especially for early classification problems.
Accuracy¶
The ratio of correctly predicted cases (both true positives and true negatives) to the total number of cases.
$\text{Accuracy} = \frac{\text{Number of Correct Predictions}}{\text{Total Number of Predictions}}$
Accuracy is a good metric when classes are balanced (i.e., there are roughly equal numbers of patients with and without heart disease).
Why It’s Misleading in This Case: If only 10% of patients have heart disease, a model that always predicts "no disease" will have 90% accuracy but will not identify at-risk patients.
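A quick sketch of that failure mode with made-up numbers (the 10% prevalence is an assumption for illustration):
import numpy as np
from sklearn.metrics import accuracy_score, recall_score
y_true_toy = np.array([0] * 90 + [1] * 10)   # 10% of patients have heart disease
y_pred_toy = np.zeros_like(y_true_toy)       # model that always predicts "no disease"
print(accuracy_score(y_true_toy, y_pred_toy))   # 0.90 -- looks impressive
print(recall_score(y_true_toy, y_pred_toy))     # 0.00 -- misses every at-risk patient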
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")
Accuracy: 0.51
Precision¶
The ratio of true positives (TP) to all predicted positives (TP + FP).
$\text{Precision} = \frac{\text{True Positives (TP)}}{\text{True Positives (TP)} + \text{False Positives (FP)}}$
In Other Words: Of all the patients the model says have heart disease, how many actually do?
Useful when the cost of a false positive is high. If Dr. Patel is concerned about sending patients for unnecessary and invasive tests, she would prioritize precision.
For multiple classes:
$\text{Precision}_{\text{micro}} = \frac{\text{Sum of True Positives (TP)}}{\text{Sum of Predicted Positives}}$
precision = precision_score(y_test, y_pred, average= 'micro')
print(f"Precision: {precision:.2f}")
Precision: 0.51
Recall (Sensitivity)¶
The ratio of true positives to all actual positives.
$\text{Recall} = \frac{\text{True Positives (TP)}}{\text{True Positives (TP)} + \text{False Negatives (FN)}}$
In Other Words: Of all the patients who truly have heart disease, how many did the model correctly identify?
Useful when the cost of a false negative is high, meaning it’s critical not to miss any patients with heart disease.
For multiple classes:
$ \text{Recall}_{\text{micro}} = \frac{\text{Sum of True Positives (TP)}}{\text{Sum of Actual Positives (TP + FN)}} $
recall = recall_score(y_test, y_pred, average= 'micro')
print(f"Recall: {recall:.2f}")
Recall: 0.51
F1 Score¶
- The harmonic mean of precision and recall.
$F1 = 2 \cdot \frac{\text{Precision} \cdot \text{Recall}}{\text{Precision} + \text{Recall}}$
- In Dr. Patel's case, both false positives and false negatives have significant consequences. The F1 score provides a balanced measure of the model's ability to correctly identify heart disease cases without overwhelming the clinic with false alarms.
- For multiple classes:
$\text{F1}_{\text{micro}} = 2 \cdot \frac{\text{Precision}_{\text{micro}} \cdot \text{Recall}_{\text{micro}}}{\text{Precision}_{\text{micro}} + \text{Recall}_{\text{micro}}}$
f1 = f1_score(y_test, y_pred, average= 'micro')
print(f"F1 Score: {f1:.2f}")
F1 Score: 0.51
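Notice that accuracy, micro-precision, micro-recall, and micro-F1 all came out identical (0.51). In a single-label multiclass problem, every prediction counts as exactly one true positive or one false-positive/false-negative pair, so micro-averaging collapses all of these metrics to accuracy. A macro average, which weights each class equally, is more revealing. A quick sketch reusing y_test and y_pred from above (zero_division=0 just silences warnings for classes that are never predicted):
precision_macro = precision_score(y_test, y_pred, average='macro', zero_division=0)
recall_macro = recall_score(y_test, y_pred, average='macro', zero_division=0)
f1_macro = f1_score(y_test, y_pred, average='macro')
print(f"Macro -- Precision: {precision_macro:.2f}, Recall: {recall_macro:.2f}, F1: {f1_macro:.2f}")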
ROC and AUC in Classification Models¶
The ROC (Receiver Operating Characteristic) curve and AUC (Area Under the Curve) help assess a model's ability to distinguish between classes at various threshold levels.
The ROC curve plots the True Positive Rate (TPR, i.e., recall) against the False Positive Rate (FPR) at different thresholds.

AUC quantifies the entire two-dimensional area underneath the ROC curve, providing a single value to summarize model performance.
Range: $0 \leq \text{AUC} \leq 1$
Interpretation:
- AUC = 1.0: Perfect model.
- AUC = 0.5: No discriminative power (random guessing).
- AUC < 0.5: Model performs worse than random guessing.
Unlike precision, recall, or accuracy, which depend on a specific threshold, AUC evaluates performance across all possible thresholds.
AUC remains a reliable metric even when class distributions are imbalanced.
y_pred_proba = model.predict_proba(X_test)
from sklearn.metrics import roc_auc_score
from sklearn.preprocessing import label_binarize
import numpy as np
# Binarize the output (One-vs-Rest approach)
classes = [0, 1, 2, 3, 4]
y_test_binarized = label_binarize(y_test, classes=classes)
# Compute the AUC for each class against the rest
roc_auc_ovr = roc_auc_score(y_test_binarized, y_pred_proba, multi_class='ovr')
print(f"One-vs-Rest ROC-AUC: {roc_auc_ovr:.2f}")
One-vs-Rest ROC-AUC: 0.79
import matplotlib.pyplot as plt
from sklearn.metrics import roc_curve
# Plot ROC for each class
for i, class_label in enumerate(classes):
    fpr, tpr, _ = roc_curve(y_test_binarized[:, i], y_pred_proba[:, i])
    plt.plot(fpr, tpr, label=f'Class {class_label} (AUC = {roc_auc_score(y_test_binarized[:, i], y_pred_proba[:, i]):.2f})')
plt.plot([0, 1], [0, 1], 'k--', label='Random Guessing')
plt.xlabel('False Positive Rate')
plt.ylabel('True Positive Rate')
plt.title('Multiclass ROC Curve')
plt.legend(loc='lower right')
plt.show()
# Compute the AUC using the One-vs-One approach.
# Note: for OvO, pass the original labels; with a binarized y_true,
# roc_auc_score treats the task as multilabel and ignores multi_class.
roc_auc_ovo = roc_auc_score(y_test, y_pred_proba, multi_class='ovo', labels=classes)
print(f"One-vs-One ROC-AUC: {roc_auc_ovo:.2f}")
One-vs-One ROC-AUC: 0.79
Choosing the Right Approach¶
When Dr. Patel finishes work, she tends her garden. Suppose she wants to build an ML algorithm to predict whether her plants need to be watered or not, planning for days she may not have time because of her busy schedule.
She gathers training data that specifies particular conditions like temperature, humidity, sunlight, etc., and the output is simply a classification (0 or 1: irrigate or not).
Consider the following true set of irrigation outputs:
[1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]
...or, water every second day...
Case 1: The ML algorithm predicts:
[1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0]
That's just 100% accurate -- great!
Case 2: The ML algorithm predicts:
[0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1]
...that's 0% accurate... but do you think the plants would grow poorly?
Case 3: The ML algorithm predicts:
[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]
Case 4: The ML algorithm predicts:
[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]
With case 1 we get 100% accuracy, with case 2 we get 0% accuracy, and with cases 3 and 4 we get 50% accuracy. Case 1 is obviously good, but are cases 3 and 4 equally good, and both (or either) better than case 2?
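A short sketch verifying those accuracy numbers with sklearn (the sequences are exactly the ones listed above):
import numpy as np
from sklearn.metrics import accuracy_score
y_true = np.array([1, 0] * 6)
cases = {
    "Case 1": np.array([1, 0] * 6),
    "Case 2": np.array([0, 1] * 6),
    "Case 3": np.ones(12, dtype=int),
    "Case 4": np.zeros(12, dtype=int),
}
for name, pred in cases.items():
    print(name, accuracy_score(y_true, pred))   # 1.0, 0.0, 0.5, 0.5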
Transforming the data: what if we looked at the cumulative irrigation decisions, i.e., the running total of waterings?
Here would be the true results:
[1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6]
And for each case:
Case 1:
[1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6]
Case 2:
[0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6]
Case 3:
[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12]
Case 4:
[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]
Metrics for Regression¶
$R^2$ (Coefficient of Determination)¶
- Measures the proportion of variance in the dependent variable explained by the independent variables.
- Provides a sense of how well the model fits the data overall.
- $R^2$ can be misleading when there are outliers.
Case 1: 1.0
Case 2: 0.83
Case 3: -3.17
Case 4: -4.2
MSE (Mean Squared Error)¶
Measures the average of the squared differences between actual and predicted values.
$\text{MSE} = \frac{1}{n} \sum_{i=1}^{n} (y_i - \hat{y}_i)^2$
Penalizes larger errors more than MAE because the errors are squared.
Provides a sense of how “bad” the larger errors are.
Since errors are squared, MSE is not in the same unit as the target variable, which makes interpretation harder.
Case 1: 0.0
Case 2: 0.5
Case 3: 12.16
Case 4: 15.16
MAE (Mean Absolute Error)¶
Measures the average of the absolute differences between actual and predicted values.
$\text{MAE} = \frac{1}{n} \sum_{i=1}^{n} |y_i - \hat{y}_i|$
MAE is simple to interpret as it provides an average error in the same units as the target variable.
Less sensitive to outliers compared to MSE and RMSE because it doesn’t square the errors.
If we judged based on the Mean Absolute Error we would get:
Case 1: 0.0
Case 2: 0.5
Case 3: 3.0
Case 4: 3.5
Now, judging by the Mean Absolute Error, Case 2 comes out clearly better than Case 3 or Case 4.
RMSE (Root Mean Squared Error)¶
- Measures the average magnitude of error in predictions, penalizing larger errors more heavily.
- $\text{RMSE} = \sqrt{\frac{1}{n} \sum_{i=1}^{n} (y_i - \hat{y}_i)^2}$
- Unlike $R^2$, RMSE provides an intuitive, absolute scale for error in the same units as the target. It highlights the impact of large prediction errors.
Case 1: 0.0
Case 2: 0.70
Case 3: 3.48
Case 4: 3.89
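All four sets of numbers above can be reproduced from the cumulative sequences; a minimal sketch using sklearn's regression metrics (RMSE computed as the square root of MSE to stay compatible across sklearn versions):
import numpy as np
from sklearn.metrics import r2_score, mean_squared_error, mean_absolute_error
y_cum = np.cumsum([1, 0] * 6)     # true cumulative waterings: [1, 1, 2, 2, ...]
preds = {
    "Case 1": np.cumsum([1, 0] * 6),
    "Case 2": np.cumsum([0, 1] * 6),
    "Case 3": np.cumsum([1] * 12),
    "Case 4": np.cumsum([0] * 12),
}
for name, p in preds.items():
    mse = mean_squared_error(y_cum, p)
    print(f"{name}: R2={r2_score(y_cum, p):.2f}, MSE={mse:.2f}, "
          f"MAE={mean_absolute_error(y_cum, p):.2f}, RMSE={np.sqrt(mse):.2f}")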
MAE is the most interpretable for irrigation decisions, showing the average error in real units. It helps in practical decision-making.
RMSE is a good compromise if larger errors are more critical but still need to be interpretable.
MSE provides more emphasis on large errors but is harder to interpret due to squared units.
R² is not ideal here since it doesn’t directly reflect the magnitude of errors; the negative values for Cases 3 and 4 simply indicate those predictions are worse than always predicting the mean.
In this context, MAE or RMSE would be the most useful metrics.
References:¶
Applications of ML notebook by Eithar Elbasheer