https://variationalform.github.io/
https://github.com/variationalform
Simon Shaw https://www.brunel.ac.uk/people/simon-shaw.
This work is licensed under CC BY-SA 4.0 (Attribution-ShareAlike 4.0 International). Visit http://creativecommons.org/licenses/by-sa/4.0/ to see the terms.
This document uses python and also makes use of LaTeX in Markdown.
Binary Classification.
Linear separability.
Separating planes, hyperplanes: decision boundaries.
Support Vectors, and SVM (Support Vector Machine) classification.
As usual our emphasis will be on doing rather than proving: just enough to make progress at pace.
For this material you are recommended Pages 1-43 of [SVMS] - this was set as homework. Also recommended is Chapter 12 of [MML] and, less so, Chapter 8.5 of [MLFCES].
These can be accessed legally and without cost.
There are also these useful references for coding:
python: https://docs.python.org/3/tutorial
numpy: https://numpy.org/doc/stable/user/quickstart.html
matplotlib: https://matplotlib.org

In the last session we moved from classification to regression and then, with logistic regression, we moved back to classification again.
In this session we will continue with the classification theme and briefly discuss Support Vector Machines (SVMs). We will then be able to move quickly on to discuss the perceptron, which will set us up for deep neural networks.
In the homework you were asked to read https://www.syncfusion.com/succinctly-free-ebooks/support-vector-machines-succinctly up to page 43. Pages 1-20 are a revision of the vector material we have already covered.
The following material assumes familiarity with that source.
We're going to start with the Iris Data Set, with the virginica data removed - just as with the logistic regression example in the last session.
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.metrics import ConfusionMatrixDisplay
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import classification_report, confusion_matrix, accuracy_score
sns.get_dataset_names()
dfi = sns.load_dataset('iris')
dfi.head()
| | sepal_length | sepal_width | petal_length | petal_width | species |
|---|---|---|---|---|---|
| 0 | 5.1 | 3.5 | 1.4 | 0.2 | setosa |
| 1 | 4.9 | 3.0 | 1.4 | 0.2 | setosa |
| 2 | 4.7 | 3.2 | 1.3 | 0.2 | setosa |
| 3 | 4.6 | 3.1 | 1.5 | 0.2 | setosa |
| 4 | 5.0 | 3.6 | 1.4 | 0.2 | setosa |
sns.pairplot(dfi, hue='species', height = 1.5)
<seaborn.axisgrid.PairGrid at 0x7fdabe52f828>
We want a binary classifier so we drop the virginica data.
# we want a binary classifier, so drop the virginica data
dfid = dfi[dfi['species'] != 'virginica']
# this leaves just two classes
sns.pairplot(dfid, hue='species', height = 1.0)
<seaborn.axisgrid.PairGrid at 0x7fdaca69bef0>
Again, we focus on the well separated petal length and sepal width for our features.
We'll use them to predict species: setosa or versicolor.
dfid.head()
| | sepal_length | sepal_width | petal_length | petal_width | species |
|---|---|---|---|---|---|
| 0 | 5.1 | 3.5 | 1.4 | 0.2 | setosa |
| 1 | 4.9 | 3.0 | 1.4 | 0.2 | setosa |
| 2 | 4.7 | 3.2 | 1.3 | 0.2 | setosa |
| 3 | 4.6 | 3.1 | 1.5 | 0.2 | setosa |
| 4 | 5.0 | 3.6 | 1.4 | 0.2 | setosa |
# we use sepal width (column 1) and petal length (column 2) as our features
X = dfid.iloc[:,[1,2]].values
# and species as our label
y = dfid.iloc[:, 4].values
# let's plot them in different colours - find the species array index sets
indxS = np.where(y == 'setosa')[0]
indxV = np.where(y != 'setosa')[0]
ax = plt.figure(figsize=(4,4))
plt.scatter(X[indxS,0], X[indxS,1], color='blue')
plt.scatter(X[indxV,0], X[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length')
Text(0, 0.5, 'petal_length')
We want a decision boundary - in this case it will be a straight line that separates the classes. Then we can classify new data according to which side of the line it falls on. This is just like we described with Logistic Regression.
Note that we can clearly see that it is possible to separate the classes with a single line. Data sets for which this is true are called linearly separable.
You can read more about this concept in, for example, [MML, Chapter 12]. Data sets which cannot be separated in this way are more difficult to work with and may require so-called kernel methods. They are beyond our scope.
Back to our data. Let's plot a few lines - which one would you prefer to use?
ax = plt.figure(figsize=(6,4))
plt.scatter(X[indxS,0], X[indxS,1], color='blue')
plt.scatter(X[indxV,0], X[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length')
plt.plot([1,5],[1,5],':m', label='line 1')
plt.plot([0,5],[1,3],':c', label='line 2')
plt.plot([2,4],[1,5],':g', label='line 3')
plt.legend()
<matplotlib.legend.Legend at 0x7fda99aa94e0>
Which one now?
ax = plt.figure(figsize=(6,4))
plt.scatter(X[indxS,0], X[indxS,1], color='blue')
plt.scatter(X[indxV,0], X[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length')
plt.plot([1,5],[1,5],':m', label='line 1')
plt.plot([0,5],[1,3],':c', label='line 2')
plt.plot([2,4],[1,5],':g', label='line 3')
plt.plot([0,5],[.85,3.55],'-.k', label='line 4')
plt.legend()
<matplotlib.legend.Legend at 0x7fdae9330198>
Let's explore this... Does this give the widest gap? Or maximum margin?
ax = plt.figure(figsize=(6,4))
plt.scatter(X[indxS,0], X[indxS,1], color='blue')
plt.scatter(X[indxV,0], X[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length')
plt.plot([0,5],[.85,3.55],':k')
plt.plot([0,5],[0.85+0.79,3.55+0.79],':k')
plt.plot([0,5],[0.85-0.79,3.55-0.79],':k')
[<matplotlib.lines.Line2D at 0x7fdaca2ae1d0>]
The previous picture illustrates the central concept behind the SVM (Support Vector Machine) classifier.
The idea is to find the decision boundary as the mid-line between the two parallel separating lines that are as far apart as possible. This separating gap is called the separating margin.
We aim to find the maximum separating margin using the training data and then, because the gap is as wide as possible, we hope that all of the unseen test and future data will fall the correct side of the decision boundary.
This method is appropriate for linearly separable data as described in the homework reading [SVMS], https://www.syncfusion.com/succinctly-free-ebooks/support-vector-machines-succinctly on page 21 onwards. The use of kernels can make this method applicable to non-linearly separable data but that is an advanced topic and beyond our scope.
We illustrated the maximum margin with 2D data. In general though our data will lie in higher dimensional space, and for that we will need more than 1D lines to describe the separating margin.
If the data were in 3D then we would separate it using the 2D version of a line, which is a plane.
Think of two adjacent rooms - the wall between them is like a plane separating the larger combined space into the two rooms. If we used just a line then it would be like a thread of cotton running from one wall to another - this would not make it clear how the space is divided into two.
Mental images and intuition fail us when the data live in higher dimensional space. But maths saves us - we use hyperplanes.
In two dimensions we are very familiar with the idea of a straight line having equation $y=mx+c$ where $m$ is called the gradient and $c$ the $y$-intercept.
These are useful but for us it will be more useful to write the vector $\boldsymbol{x}=(x_1, x_2)^T$ in place of $(x,y)$ and define our straight line by the equation
$$ \boldsymbol{w}\cdot\boldsymbol{x} = \phi $$
for given weights, $\boldsymbol{w} = (w_1, w_2)^T$, and some constant $\phi$.
For example, the equation $y=\frac{4}{5}x+7$ becomes
$$ x_2 = \frac{4}{5}x_1+7 \quad\Longrightarrow\quad -4x_1+5x_2 = 35 \quad\Longrightarrow\quad \boldsymbol{w}\cdot\boldsymbol{x} = \phi $$
for $\boldsymbol{w}=(-4,5)^T$ and $\phi=35$.
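As a quick numerical check of this example (a small aside using numpy), we can evaluate $\boldsymbol{w}\cdot\boldsymbol{x}$ at several points on the line and confirm that we always get $\phi=35$.
import numpy as np
# check: y = (4/5)x + 7 is the same as w.x = phi with w = (-4, 5) and phi = 35
w = np.array([-4.0, 5.0])
x1 = np.linspace(-5, 5, 11)
x2 = (4/5)*x1 + 7                 # points (x1, x2) on the line
print(w @ np.stack([x1, x2]))     # every entry is 35.0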
Let $\boldsymbol{x}_a$ and $\boldsymbol{x}_b$ be two distinct points on the line - as represented by vectors pointing from the origin and ending on the line - then,
$$ \boldsymbol{w}\cdot\boldsymbol{x}_a - \boldsymbol{w}\cdot\boldsymbol{x}_b = \phi - \phi = 0 \quad\Longrightarrow\quad \boldsymbol{w}\cdot(\boldsymbol{x}_a - \boldsymbol{x}_b) = 0. $$
THINK ABOUT: what does this mean geometrically? What is the angle between the line and the vector $\boldsymbol{w}$?
In more than two dimensions, in $\mathbb{R}^n$ say, we would have $\boldsymbol{x}= (x_1, x_2, \ldots, x_n)^T$ and a vector of weights $\boldsymbol{w}$ for which
$$ \boldsymbol{w}\cdot\boldsymbol{x} = \phi $$
just as above. If $\boldsymbol{x}= (x_1, x_2, x_3)^T$ then this is
$$ w_1 x_1 + w_2 x_2 + w_3 x_3 = \phi $$
which defines a plane - an infinite flat surface. In higher dimensions we call it a hyperplane.
Suppose a point $Q$ is described by the vector $\boldsymbol{q}$ rooted at the origin. We can ask: What is the shortest distance from this point to the hyperplane?
To answer this imagine you are standing on one side of a busy road and want to cross to the other side. You would want to minimise the time you spend on the road and so would choose to cross by moving at a right angle to the road.
That is just the case with our point $Q$. The shortest distance to the hyperplane is along the path that meets the plane at a right angle in all directions.
It's like a tall tree growing vertically from the plane ground. However: this is just an analogy, not a plug for flat earth theory.
To figure out this distance we move from the origin to $Q$, by moving to the end of the vector $\boldsymbol{q}$. We then move a distance $d$ along a line parallel to $\boldsymbol{w}$ in the direction towards the plane.
$$ \text{This takes us to the point}\qquad \boldsymbol{y} = \boldsymbol{q} + \frac{d\,\boldsymbol{w}}{\Vert\boldsymbol{w}\Vert_2}. $$
THINK ABOUT: why is the length of $\boldsymbol{w}$ in the denominator?
If we insist that the point $\boldsymbol{y}$ is actually a point $\boldsymbol{x}$ on the hyperplane, then $\boldsymbol{w}^T\boldsymbol{x}=\phi$ and
$$ \boldsymbol{y} = \boldsymbol{x}\qquad\text{ means }\qquad \phi = \boldsymbol{w}^T\boldsymbol{y} = \boldsymbol{w}^T\boldsymbol{x} = \boldsymbol{w}^T\boldsymbol{q} + d\frac{\boldsymbol{w}^T\boldsymbol{w}}{\Vert\boldsymbol{w}\Vert_2} = \boldsymbol{w}^T\boldsymbol{q} + d\Vert\boldsymbol{w}\Vert_2. $$
The shortest distance $d$ from $Q$ to the hyperplane is then
$$ d = \frac{\phi-\boldsymbol{w}^T\boldsymbol{q}}{\Vert\boldsymbol{w}\Vert_2}. $$
Note that this distance is signed. See also [SVMS, page 46] for an alternative derivation.
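As a small sketch (the helper name signed_distance is ours, not from [SVMS]), this formula is easy to code and check against the example line from earlier.
def signed_distance(w, phi, q):
    # signed distance from the point q to the hyperplane w.x = phi
    return (phi - w @ q) / np.linalg.norm(w)
w = np.array([-4.0, 5.0]); phi = 35.0
print(signed_distance(w, phi, np.array([0.0, 7.0])))   # 0.0: this point is on the line
print(signed_distance(w, phi, np.array([0.0, 0.0])))   # about 5.47: the origin is not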
We've already seen why this is important in data science with the earlier Iris Data Set example. The situation is ubiquitous. Here's another example of why this geometrical view is relevant.
We have seen how data sets comprise rows of observations, each having several characteristics or features.
Each stock in the FTSE 100 for example has a daily high, a daily low, percentage change, a yield, a volume traded, market capitalization and so on. Each item can therefore be thought of as a point in high dimensional space. For example, for a given stock, the six quantities, or features, just listed could be represented by this feature vector,
$$ \left( \begin{array}{r} x_1 \\ x_2 \\ x_3 \\ x_4 \\ x_5 \\ x_6 \end{array} \right) = \left( \begin{array}{r} \text{daily high} \\ \text{daily low} \\ \text{percentage change} \\ \text{yield} \\ \text{volume traded} \\ \text{market cap.} \end{array} \right) $$
We have seen with our Iris data above that a way to classify such data is to try and separate these points into two distinct groups.
If we can do that we have in some sense reduced our mass of data down to two essential clusters.
We can do that by trying to find a hyperplane that passes between the two clusters. We would want the hyperplane to be as far away from all of the points as possible so that it makes a clear distinction between the two clusters.
This would mean finding $d$ for each point, each feature vector, and making sure that the minimum value of all such $d$-values is as large as possible.
THINK ABOUT: can you sketch this situation in 2D? Does this seem to be a difficult thing to do in general?
Fortunately we only have to understand this in the simplest case. We will be using software to solve the 'real' problems.
We now have a mathematical expression for the signed distance $d$ between a point $\boldsymbol{q}$ and the hyperplane $\boldsymbol{w}^T\boldsymbol{x}=\phi$.
The two classes in the training data are labelled as positive or negative. A data point in the positive class is labelled as $y=+1$ and a point in the negative class is labelled as $y=-1$.
The negative class corresponds to negative distances, $d$.
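In our Iris example the labels are strings rather than $\pm 1$. If we wanted to use this sign convention directly we could map them like this (which species gets $+1$ is an arbitrary choice of ours).
# map the string labels to the +/-1 convention (the sign choice is arbitrary)
y_pm = np.where(y == 'setosa', 1, -1)
print(np.unique(y_pm, return_counts=True))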
We imagine visiting every training data point $\boldsymbol{q}_k$, for $k=1,\ldots,N$ (say there are $N$ in total), finding the label $y_k$ and distance $d_k$, and calculating $D_k = d_k y_k \ge 0$. Then:
Determine $\phi$ and $\boldsymbol{w}$ such that the minimum of $D_k$ is maximized.
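To make the objective concrete, here is a small sketch (the helper name and the toy points are ours) that evaluates the quantity being maximized, $\min_k D_k$, for one candidate $\boldsymbol{w}$ and $\phi$. The training problem is to search over all $\boldsymbol{w}$ and $\phi$ to make this value as large as possible.
def worst_case_margin(w, phi, Q, y_pm):
    # D_k = y_k d_k for each row q_k of Q, using the signed distance derived above
    d = (phi - Q @ w) / np.linalg.norm(w)
    return np.min(y_pm * d)
# a toy example: two points either side of the line -4 x1 + 5 x2 = 35
w = np.array([-4.0, 5.0]); phi = 35.0
Q = np.array([[0.0, 9.0], [0.0, 5.0]])
print(worst_case_margin(w, phi, Q, np.array([-1, 1])))   # positive: this (w, phi) separates the toy data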
This optimization problem is mathematically very challenging. See [SVMS, Chapter 4] and [MML, Chapter 12] if you want some insight as to why.
We'll use software...
sklearn

Recall that we already set up X and y for the petal length and sepal width iris data above with
X = dfid.iloc[:,[1,2]].values
y = dfid.iloc[:, 4].values
dfid.head(2)
| | sepal_length | sepal_width | petal_length | petal_width | species |
|---|---|---|---|---|---|
| 0 | 5.1 | 3.5 | 1.4 | 0.2 | setosa |
| 1 | 4.9 | 3.0 | 1.4 | 0.2 | setosa |
The Support Vector Machine, or SVM, classification method uses the setting described above to determine a maximum separating margin from training data. The mid-plane (in general hyperplane) is then a decision boundary between the two classes.
The rationale for this approach is that because the separation is maximized, we expect that even unseen test and future data will fall on the correct side of the decision boundary. This will be enough for correct classification - even though it may stray into the separating margin.
We'll use the sklearn
SVM capability: https://scikit-learn.org/stable/modules/svm.html
# We'll use 50% of the data to test
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.50)
Should we scale the data? On the face of it, it seems that it isn't needed.
We'll use a python if statement to leave the option open.
if False:
scaler = StandardScaler()
# initialise the scaler by feeding it the training data
scaler.fit(X_train)
# now carry out the transformation of all of the feature data
X_train = scaler.transform(X_train)
X_test = scaler.transform(X_test)
Toggle if False: and if True: to switch scaling off/on.
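As an aside, an alternative way to keep the scaling decision flexible is an sklearn Pipeline that chains an optional scaler with the classifier. This is just a sketch of a different style, not what we do below.
from sklearn.pipeline import Pipeline
from sklearn.svm import SVC
use_scaling = False   # flip to True to standardise the features
steps = ([('scale', StandardScaler())] if use_scaling else []) + [('svc', SVC(kernel='linear'))]
pipe = Pipeline(steps)
# pipe.fit(X_train, y_train) and pipe.predict(X_test) then work just like svmclf below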
# import the SVM classifier
from sklearn import svm
# instance it
svmclf = svm.SVC(kernel='linear')
# and fit the training data
svmclf.fit(X_train, y_train)
SVC(kernel='linear')
# make predictions on the test set
y_pred = svmclf.predict(X_test)
# get the confusion matrix and accuracy data
cm = confusion_matrix(y_test, y_pred)
print("Confusion Matrix:")
print(cm)
accsc = accuracy_score(y_test,y_pred)
print("Accuracy:", accsc)
Confusion Matrix:
[[25  0]
 [ 0 25]]
Accuracy: 1.0
# plot a nicer confusion matrix
cmplot = ConfusionMatrixDisplay(cm, display_labels=svmclf.classes_)
cmplot.plot()
plt.show()
This is perfect - but it ought to be because the original data were well separated.
Let's look at the data and the SVM in pictures - we will get more insight.
We'll start with the training data - these are the data points the SVM used.
indxS = np.where(y_train == 'setosa')[0]
indxV = np.where(y_train != 'setosa')[0]
plt.scatter(X_train[indxS,0], X_train[indxS,1], color='blue')
plt.scatter(X_train[indxV,0], X_train[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length');
The SVM classifier also provides support vectors. These take a little explaining: the optimization process determines a subset of the training points that is enough to determine the maximum separating margin. The points in that subset are called support vectors.
# get support vectors
SVecs = svmclf.support_vectors_
print('The (transposed) support vectors are:\n', SVecs.T)
# get number of support vectors for each class
NumSVecs = svmclf.n_support_
print('There are these many per class', NumSVecs)
The (transposed) support vectors are:
 [[3.4 2.5]
 [1.9 3. ]]
There are these many per class [1 1]
The support vectors tell us which data points are forming the margin. (It's actually a bit more complicated than that - we'll come back to this below.)
plt.scatter(X_train[indxS,0], X_train[indxS,1], color='blue')
plt.scatter(X_train[indxV,0], X_train[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length');
# plot the support vectors
for k in range(NumSVecs.sum()):
plt.plot([0,SVecs[k,0]],[0,SVecs[k,1]],'k')
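If you want to know exactly which rows of the training set were selected as support vectors, sklearn exposes their indices directly (a small aside).
# indices of the support vectors within X_train, and their labels
print('support vector indices:', svmclf.support_)
print('their labels:', y_train[svmclf.support_])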
The SVM classifier can also tell us the equation of the hyperplane decision boundary.
It has the form $ax_1 + bx_2 + c = 0$ where...
# a x1 + b x2 + c = 0
a = svmclf.coef_[0,0]
b = svmclf.coef_[0,1]
c = svmclf.intercept_[0]
print(f'a={a}, b={b}, c={c}')
a=-0.8910889164381169, b=1.0891086756465878, c=-0.0396039140724227
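As an aside, the fitted coefficients also give the margin width: under the usual SVC convention the margin edges satisfy $ax_1 + bx_2 + c = \pm 1$, so the full width of the margin is $2/\Vert\boldsymbol{w}\Vert_2$ with $\boldsymbol{w}=(a,b)^T$.
# margin full width is 2/||w||_2 under the convention that the margin edges sit at +/- 1
w_fit = svmclf.coef_[0]
print('margin full width =', 2.0/np.linalg.norm(w_fit))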
Let's add this to the plot using $x_2 = -(a x_1 + c)/b$ (which requires $b\ne 0$).
We can set up two points and join them with a straight line:
$$ P_1:\ (x_1, x_2) = (0, -c/b) \qquad\text{ and }\qquad P_2:\ (x_1, x_2) = (6, -(6a + c)/b). $$
P1 = np.array([0, -c/b]); P2=np.array([6, -(6*a + c)/b])
plt.scatter(X_train[indxS,0], X_train[indxS,1], color='blue')
plt.scatter(X_train[indxV,0], X_train[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length');
# plot the support vectors
for k in range(NumSVecs.sum()):
plt.plot([0,SVecs[k,0]],[0,SVecs[k,1]],':k')
# the decision boundary
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
[<matplotlib.lines.Line2D at 0x7fdac9bb9780>]
We can also draw parallel lines through the support vector data points.
In general, with the decision boundary given by $ax_1 + bx_2 +c = 0$, a parallel line passing through $\boldsymbol{q}=(q_1, q_2)^T$ satisfies
$$ a(x_1 - q_1) + b(x_2 - q_2) = 0 $$because $a$ and $b$ control the gradient and so must be the same.
Hence,
$$ a x_1 + b x_2 + c_q = 0 \quad\text{where}\quad c_q = - a q_1 - b q_2. $$
We can add the parallel margin edges to the plot with this...
plt.scatter(X_train[indxS,0], X_train[indxS,1], color='blue')
plt.scatter(X_train[indxV,0], X_train[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length');
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
for k in range(NumSVecs.sum()):
plt.plot([0,SVecs[k,0]],[0,SVecs[k,1]],':k')
q = np.array([SVecs[k,0],SVecs[k,1]])
cq = -a*q[0]-b*q[1]; P1[1]=-(0*a + cq)/b; P2[1]=-(6*a + cq)/b
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
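As a quick sanity check on the margin edges we just drew (assuming the usual SVC convention that the decision function equals $\pm 1$ there), the decision values at the support vectors should be close to $\pm 1$.
# decision function values at the support vectors should be roughly +/- 1
print(svmclf.decision_function(SVecs))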
NOTE
The code above may seem a bit overwhelming but in the end we are just identifying points and joining them up with straight lines.
The most important things to gain from this are the pictures, for they explain how the SVM classifier works.
Let's plot the same pictures, but with the predicted values from the test data.
indxS = np.where(y_pred == 'setosa')[0]
indxV = np.where(y_pred != 'setosa')[0]
P1 = np.array([0, -c/b]); P2=np.array([6, -(6*a + c)/b])
plt.scatter(X_test[indxS,0], X_test[indxS,1], color='blue')
plt.scatter(X_test[indxV,0], X_test[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('petal_length');
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
for k in range(NumSVecs.sum()):
plt.plot([0,SVecs[k,0]],[0,SVecs[k,1]],':k')
q = np.array([SVecs[k,0],SVecs[k,1]])
cq = -a*q[0]-b*q[1]; P1[1]=-(0*a + cq)/b; P2[1]=-(6*a + cq)/b
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
This is working well because we have very highly separated data.
Let's go back to the data set and pick another pair of features for which the separation is not as good.
sns.pairplot(dfid, hue='species', height = 1.0)
<seaborn.axisgrid.PairGrid at 0x7fdaca7eac50>
Let's choose sepal width and sepal length.
dfid.head(2)
| | sepal_length | sepal_width | petal_length | petal_width | species |
|---|---|---|---|---|---|
| 0 | 5.1 | 3.5 | 1.4 | 0.2 | setosa |
| 1 | 4.9 | 3.0 | 1.4 | 0.2 | setosa |
# we use sepal width (column 1) and sepal length (column 0) as our features
X = dfid.iloc[:,[1,0]].values
# and species as our label
y = dfid.iloc[:, 4].values
# We'll use 50% of the data to test
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.50)
# instance the SVM - C is the penalty parameter: larger C penalizes margin violations more heavily
svmclf = svm.SVC(kernel='linear', C=100)
# and fit the training data
svmclf.fit(X_train, y_train)
# make predictions on the test set
y_pred = svmclf.predict(X_test)
# get the confusion matrix and accuracy data
cm = confusion_matrix(y_test, y_pred)
print("Confusion Matrix:")
print(cm)
accsc = accuracy_score(y_test,y_pred)
print("Accuracy:", accsc)
Confusion Matrix:
[[24  0]
 [ 0 26]]
Accuracy: 1.0
# plot a nicer confusion matrix
cmplot = ConfusionMatrixDisplay(cm, display_labels=svmclf.classes_)
cmplot.plot()
plt.show()
There are more support vectors this time (three rather than two). These are the ones used in the optimization process.
indxS = np.where(y_train == 'setosa')[0]
indxV = np.where(y_train != 'setosa')[0]
# get support vectors and number of them for each class
NumSVecs = svmclf.n_support_
print('There are these many per class', NumSVecs)
SVecs = svmclf.support_vectors_
print('The transposed support vectors are:\n', SVecs.T)
There are these many per class [2 1]
The transposed support vectors are:
 [[3.  2.3 2.7]
 [5.  4.5 5.2]]
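The parameter C matters here: smaller C tolerates more margin violations, which typically means more support vectors. A quick exploratory sketch (not part of the original workflow):
# how the number of support vectors and test accuracy vary with C (illustrative only)
for C in [0.1, 1, 10, 100]:
    clf = svm.SVC(kernel='linear', C=C).fit(X_train, y_train)
    print(f'C={C:>5}: n_support={clf.n_support_}, test accuracy={clf.score(X_test, y_test):.2f}')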
We can get the equation of the decision boundary as before...
# a x1 + b x2 + c = 0 => x2 = -(a x1 + c)/b
print('svmclf.intercept_ = ', svmclf.intercept_.shape)
a = svmclf.coef_[0,0]
b = svmclf.coef_[0,1]
c = svmclf.intercept_[0]
print(f'a={a}, b={b}, c={c}')
P1 = np.array([2, -(2*a + c)/b]); P2=np.array([4, -(4*a + c)/b])
print('P1 = ', P1, ', P2 = ', P2)
svmclf.intercept_ =  (1,)
a=-3.4474171551963138, b=4.827039147149825, c=-14.792726635865433
P1 =  [2. 4.49293248] , P2 =  [4. 5.92131002]
# plot the training data with the support vectors
plt.figure(figsize=(5,5));
plt.scatter(X_train[indxS,0], X_train[indxS,1], color='blue')
plt.scatter(X_train[indxV,0], X_train[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('sepal_length');
# plot the support vectors in black - stemming from the origin
for k in range(NumSVecs.sum()):
plt.plot([0,SVecs[k,0]],[0,SVecs[k,1]],'k')
plt.xlim(2,5); plt.ylim(4,7)
(4.0, 7.0)
# plot training data with decision boundary
plt.figure(figsize=(5,5))
plt.scatter(X_train[indxS,0], X_train[indxS,1], color='blue')
plt.scatter(X_train[indxV,0], X_train[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('sepal_length');
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
#plt.plot(xx, yy, "y-")
[<matplotlib.lines.Line2D at 0x7fdabea12048>]
Let's look at the predictions
indxS = np.where(y_pred == 'setosa')[0]
indxV = np.where(y_pred != 'setosa')[0]
P1 = np.array([2, -(2*a + c)/b]); P2=np.array([4, -(4*a + c)/b])
# test data with predictions and decision boundary
plt.figure(figsize=(5,5))
plt.scatter(X_test[indxS,0], X_test[indxS,1], color='blue')
plt.scatter(X_test[indxV,0], X_test[indxV,1], color='red')
plt.axis('equal'); plt.xlabel('sepal_width'); plt.ylabel('sepal_length');
plt.plot([P1[0],P2[0]],[P1[1],P2[1]],'k')
[<matplotlib.lines.Line2D at 0x7fdae9466f60>]
The separation of the data is less than before, so the SVM might not do as well.
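With a single 50/50 split the headline accuracy can flatter the classifier. One quick way to probe this (an aside, not part of the notebook above) is cross-validation over the whole feature set.
from sklearn.model_selection import cross_val_score
scores = cross_val_score(svm.SVC(kernel='linear', C=100), X, y, cv=5)
print('cross-validated accuracy: %.3f +/- %.3f' % (scores.mean(), scores.std()))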
We covered just enough to make progress at pace. We looked at binary classification, linear separability, separating hyperplanes as decision boundaries, and SVM classification with support vectors.
The SVM is an important tool, and like many of the other things we have discussed, we could talk much more about it. It can for example be used in multi-class applications and also for regression.
However, we have a much bigger goal: deep neural networks.
For that we need to move on to the perceptron.