Lab 03 : Kernel/Non-Linear SVM
Machine Learning
Machine Learning
xuxh@dp.tech
更新于 2024-10-15
推荐镜像 :Basic Image:bohrium-notebook:2023-04-07
推荐机型 :c2_m4_cpu

Lecture : Graph SVM

Lab 03 : Kernel/Non-Linear SVM

Xavier Bresson

[1]
# For Google Colaboratory
import sys, os
if 'google.colab' in sys.modules:
    # mount google drive
    from google.colab import drive
    drive.mount('/content/gdrive')
    path_to_file = '/content/gdrive/My Drive/GML2023_codes/codes/04_Graph_SVM'
    print(path_to_file)
    # change current path to the folder containing "path_to_file"
    os.chdir(path_to_file)
    !pwd

[2]
# Load libraries
import numpy as np
import scipy.io
import scipy.sparse.linalg  # needed for scipy.sparse.linalg.cg used below
%matplotlib inline
#%matplotlib notebook
from matplotlib import pyplot
import matplotlib.pyplot as plt
from IPython.display import display, clear_output
plt.rcParams.update({'figure.max_open_warning': 0})
import time
import sys; sys.path.insert(0, 'lib/')
from lib.utils import compute_purity
from lib.utils import compute_SVM
import warnings; warnings.filterwarnings("ignore")
import sklearn.metrics.pairwise


Non-linearly separable data points
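
The two half-moon classes below are not linearly separable: no single line w^T x + b = 0 can split them, so a linear SVM will necessarily misclassify points. This motivates the kernel SVM further down.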

[3]
# Dataset
mat = scipy.io.loadmat('datasets/data_twomoons_kernelSVM.mat')
Xtrain = mat['Xtrain']
Cgt_train = mat['C_train_errors'] - 1; Cgt_train = Cgt_train.squeeze() # train ground truth in {0,1}, with 25% label errors
l_train = mat['l'].squeeze() # training labels in {-1,+1}
n = Xtrain.shape[0]
d = Xtrain.shape[1]
nc = len(np.unique(Cgt_train)) # number of classes
print(n,d,nc)
Xtest = mat['Xtest']
Cgt_test = mat['Cgt_test'] - 1; Cgt_test = Cgt_test.squeeze() # test ground truth in {0,1}

500 100 2
[4]
# Plot
plt.figure(figsize=(10,4))
p1 = plt.subplot(121)
size_vertex_plot = 33
plt.scatter(Xtrain[:,0], Xtrain[:,1], s=size_vertex_plot*np.ones(n), c=Cgt_train, color=pyplot.jet())
plt.title('Training Data with 25% ERRORS')
p2 = plt.subplot(122)
size_vertex_plot = 33
plt.scatter(Xtest[:,0], Xtest[:,1], s=size_vertex_plot*np.ones(n), c=Cgt_test, color=pyplot.jet())
plt.title('Test Data')
#plt.tight_layout()
plt.show()

[Figure: scatter plots of the training data with 25% label errors (left) and the test data (right)]

Run soft-margin SVM
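
The cell below solves the soft-margin SVM in dual form: maximize sum_i alpha_i - (1/2) alpha^T Q alpha over the box 0 <= alpha_i <= lamb, with Q = L Ker L, L = diag(l) and the linear kernel Ker = Xtrain Xtrain^T. The balance constraint l^T alpha = 0 is enforced through a scalar dual variable beta, updated by gradient ascent. Each alpha update is an implicit gradient step, solved approximately by conjugate gradient on (I + tau_alpha Q) alpha_new = alpha + tau_alpha (1 - beta l), followed by projection onto the box; the offset b is then estimated by averaging over the detected support vectors.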

[5]
# Run soft-margin SVM

# Compute linear kernel, L, Q
Ker = Xtrain.dot(Xtrain.T)
l = l_train
L = np.diag(l)
Q = L.dot(Ker.dot(L))

# Time steps
tau_alpha = 10/ np.linalg.norm(Q,2)
tau_beta = 0.1/ np.linalg.norm(L,2)

# For conjugate gradient
Acg = tau_alpha* Q + np.eye(n)

# Pre-compute L.K(Xtest) for test data
LKXtest = L.dot(Xtrain.dot(Xtest.T))

# Error parameter
lamb = 0.1 # acc: 83%

# Initialization
alpha = np.zeros([n])
beta = 0.0
alpha_old = alpha

# Loop
k = 0
diff_alpha = 1e6
num_iter = 201
while (diff_alpha>1e-3) & (k<num_iter):

    # Update iteration
    k += 1

    # Update alpha
    # Approximate solution with conjugate gradient
    b0 = alpha + tau_alpha - tau_alpha* l* beta
    alpha, _ = scipy.sparse.linalg.cg(Acg, b0, x0=alpha, tol=1e-3, maxiter=50)
    alpha[alpha<0.0] = 0 # Projection on [0,+infty]
    alpha[alpha>lamb] = lamb # Projection on [-infty,lamb]

    # Update beta
    beta = beta + tau_beta* l.T.dot(alpha)

    # Stopping condition
    diff_alpha = np.linalg.norm(alpha-alpha_old)
    alpha_old = alpha

    # Plot every 10 iterations and at convergence
    if not(k%10) or (diff_alpha<1e-3):

        # Indicator function of support vectors
        idx = np.where( np.abs(alpha)>0.25* np.max(np.abs(alpha)) )
        Isv = np.zeros([n]); Isv[idx] = 1
        nb_sv = len(Isv.nonzero()[0])

        # Offset
        if nb_sv > 1:
            b = (Isv.T).dot( l - Ker.dot(L.dot(alpha)) )/ nb_sv
        else:
            b = 0

        # Continuous score function
        f_test = alpha.T.dot(LKXtest) + b

        # Binary classification function
        C_test = np.sign(f_test) # decision function in {-1,1}
        accuracy_test = compute_purity(0.5*(1+C_test),Cgt_test,nc) # 0.5*(1+C_test) in {0,1}

        # Plot
        size_vertex_plot = 33
        plt.figure(figsize=(12,4))
        p1 = plt.subplot(121)
        plt.scatter(Xtest[:,0], Xtest[:,1], s=size_vertex_plot*np.ones(n), c=f_test, color=pyplot.jet())
        plt.title('Score function $s(x)=w^Tx+b$ \n iter=' + str(k)+ ', diff_alpha=' + str(diff_alpha)[:7])
        plt.colorbar()
        p2 = plt.subplot(122)
        plt.scatter(Xtest[:,0], Xtest[:,1], s=size_vertex_plot*np.ones(n), c=C_test, color=pyplot.jet())
        plt.title('Classification function $f(x)=sign(w^Tx+b)$\n iter=' + str(k) + ', acc=' + str(accuracy_test)[:5])
        #plt.tight_layout()
        plt.colorbar()
        plt.show()
        if k<num_iter-1:
            clear_output(wait=True)

[Figure: score function s(x)=w^Tx+b (left) and classification sign(w^Tx+b) (right) on the test data]
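
As an optional cross-check (not part of the original lab), the same problem can be handed to scikit-learn. This is a minimal sketch: the accuracy should be comparable but not identical, since SVC uses a different solver, stopping rule, and offset estimate.

[ ]
# Optional cross-check with scikit-learn (not part of the original lab).
from sklearn.svm import SVC
clf = SVC(kernel='linear', C=lamb)       # C plays the role of lamb above
clf.fit(Xtrain, l_train)                 # labels in {-1,+1}
C_test_sk = clf.predict(Xtest)
acc_sk = compute_purity(0.5*(1+C_test_sk), Cgt_test, nc)  # map {-1,1} -> {0,1}
print('scikit-learn linear SVC acc:', str(acc_sk)[:5])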

Run kernel SVM
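
The main change from the soft-margin run above is the kernel: the linear kernel is replaced by a Gaussian kernel Ker(x_i, x_j) = exp(-||x_i - x_j||^2 / sigma^2) with sigma = 0.5, so the score function becomes s(x) = w^T phi(x) + b for the implicit feature map phi of the kernel; the error parameter lamb is also raised to 3. The optimization loop itself is unchanged.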

[6]
# Run kernel SVM

# Compute Gaussian kernel, L, Q
sigma = 0.5; sigma2 = sigma**2
Ddist = sklearn.metrics.pairwise.pairwise_distances(Xtrain, Xtrain, metric='euclidean', n_jobs=1)
Ker = np.exp(- Ddist**2 / sigma2)
Ddist = sklearn.metrics.pairwise.pairwise_distances(Xtrain, Xtest, metric='euclidean', n_jobs=1)
KXtest = np.exp(- Ddist**2 / sigma2)
l = l_train
L = np.diag(l)
Q = L.dot(Ker.dot(L))

# Time steps
tau_alpha = 10/ np.linalg.norm(Q,2)
tau_beta = 0.1/ np.linalg.norm(L,2)

# For conjugate gradient
Acg = tau_alpha* Q + np.eye(n)

# Pre-compute L.K(Xtest) for test data
LKXtest = L.dot(KXtest)

# Error parameter
lamb = 3 # acc: 95.4

# Initialization
alpha = np.zeros([n])
beta = 0.0
alpha_old = alpha

# Loop
k = 0
diff_alpha = 1e6
num_iter = 201
while (diff_alpha>1e-3) & (k<num_iter):

    # Update iteration
    k += 1

    # Update alpha
    # Approximate solution with conjugate gradient
    b0 = alpha + tau_alpha - tau_alpha* l* beta
    alpha, _ = scipy.sparse.linalg.cg(Acg, b0, x0=alpha, tol=1e-3, maxiter=50)
    alpha[alpha<0.0] = 0 # Projection on [0,+infty]
    alpha[alpha>lamb] = lamb # Projection on [-infty,lamb]

    # Update beta
    beta = beta + tau_beta* l.T.dot(alpha)

    # Stopping condition
    diff_alpha = np.linalg.norm(alpha-alpha_old)
    alpha_old = alpha

    # Plot every 10 iterations and at convergence
    if not(k%10) or (diff_alpha<1e-3):

        # Indicator function of support vectors
        idx = np.where( np.abs(alpha)>0.25* np.max(np.abs(alpha)) )
        Isv = np.zeros([n]); Isv[idx] = 1
        nb_sv = len(Isv.nonzero()[0])

        # Offset
        if nb_sv > 1:
            b = (Isv.T).dot( l - Ker.dot(L.dot(alpha)) )/ nb_sv
        else:
            b = 0

        # Continuous score function
        f_test = alpha.T.dot(LKXtest) + b

        # Binary classification function
        C_test = np.sign(f_test) # decision function in {-1,1}
        accuracy_test = compute_purity(0.5*(1+C_test),Cgt_test,nc) # 0.5*(1+C_test) in {0,1}

        # Plot
        size_vertex_plot = 33
        plt.figure(figsize=(12,4))
        p1 = plt.subplot(121)
        plt.scatter(Xtest[:,0], Xtest[:,1], s=size_vertex_plot*np.ones(n), c=f_test, color=pyplot.jet())
        plt.title('Score function $s(x)=w^T\phi(x)+b$ \n iter=' + str(k)+ ', diff_alpha=' + str(diff_alpha)[:7])
        plt.colorbar()
        p2 = plt.subplot(122)
        plt.scatter(Xtest[:,0], Xtest[:,1], s=size_vertex_plot*np.ones(n), c=C_test, color=pyplot.jet())
        plt.title('Classification function $f(x)=sign(w^T\phi(x)+b)$\n iter=' + str(k) + ', acc=' + str(accuracy_test)[:5])
        #plt.tight_layout()
        plt.colorbar()
        plt.show()
        if k<num_iter-1:
            clear_output(wait=True)

[Figure: score function s(x)=w^T phi(x)+b (left) and classification sign(w^T phi(x)+b) (right) on the test data]
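
Again as an optional cross-check (not part of the original lab): scikit-learn's RBF kernel is exp(-gamma ||x-y||^2), so gamma = 1/sigma2 matches the kernel computed above. A minimal sketch:

[ ]
# Optional cross-check with scikit-learn (not part of the original lab).
from sklearn.svm import SVC
clf = SVC(kernel='rbf', gamma=1.0/sigma2, C=lamb)  # gamma=1/sigma^2 matches exp(-d^2/sigma^2)
clf.fit(Xtrain, l_train)
C_test_sk = clf.predict(Xtest)
acc_sk = compute_purity(0.5*(1+C_test_sk), Cgt_test, nc)
print('scikit-learn RBF SVC acc:', str(acc_sk)[:5])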

Real-world graph of articles
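
The next experiment moves to a small real text dataset: judging by the file name data_20news_50labels.mat and the printed dimensions, 50 labeled 20 Newsgroups documents represented by d = 3684 word features, with two classes.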

[7]
# Dataset
mat = scipy.io.loadmat('datasets/data_20news_50labels.mat')
Xtrain = mat['Xtrain']
l_train = mat['l'].squeeze() # training labels in {-1,+1}
n = Xtrain.shape[0]
d = Xtrain.shape[1]
Xtest = mat['Xtest']
Cgt_test = mat['Cgt_test'] - 1; Cgt_test = Cgt_test.squeeze() # test ground truth in {0,1}
nc = len(np.unique(Cgt_test)) # number of classes
print(n,d,nc)

50 3684 2

Run linear SVM

[8]
# Run linear SVM

# Compute kernel, L, Q (pairwise Euclidean distances are used as the kernel matrix here)
Ker = sklearn.metrics.pairwise.pairwise_distances(Xtrain, Xtrain, metric='euclidean', n_jobs=1)
KXtest = sklearn.metrics.pairwise.pairwise_distances(Xtrain, Xtest, metric='euclidean', n_jobs=1)
l = l_train
L = np.diag(l)
Q = L.dot(Ker.dot(L))

# Time steps
tau_alpha = 10/ np.linalg.norm(Q,2)
tau_beta = 0.1/ np.linalg.norm(L,2)

# For conjugate gradient
Acg = tau_alpha* Q + np.eye(n)

# Pre-compute L.K(Xtest) for test data
LKXtest = L.dot(KXtest)

# Error parameter
lamb = 3 # acc: 83.5

# Initialization
alpha = np.zeros([n])
beta = 0.0
alpha_old = alpha

# Loop
k = 0
diff_alpha = 1e6
num_iter = 201
while (diff_alpha>1e-3) & (k<num_iter):

    # Update iteration
    k += 1

    # Update alpha
    # Approximate solution with conjugate gradient
    b0 = alpha + tau_alpha - tau_alpha* l* beta
    alpha, _ = scipy.sparse.linalg.cg(Acg, b0, x0=alpha, tol=1e-3, maxiter=50)
    alpha[alpha<0.0] = 0 # Projection on [0,+infty]
    alpha[alpha>lamb] = lamb # Projection on [-infty,lamb]

    # Update beta
    beta = beta + tau_beta* l.T.dot(alpha)

    # Stopping condition
    diff_alpha = np.linalg.norm(alpha-alpha_old)
    alpha_old = alpha

    # Evaluate every 10 iterations and at convergence
    if not(k%10) or (diff_alpha<1e-3):

        # Indicator function of support vectors
        idx = np.where( np.abs(alpha)>0.25* np.max(np.abs(alpha)) )
        Isv = np.zeros([n]); Isv[idx] = 1
        nb_sv = len(Isv.nonzero()[0])

        # Offset
        if nb_sv > 1:
            b = (Isv.T).dot( l - Ker.dot(L.dot(alpha)) )/ nb_sv
        else:
            b = 0

        # Continuous score function
        f_test = alpha.T.dot(LKXtest) + b

        # Binary classification function
        C_test = np.sign(f_test) # decision function in {-1,1}
        accuracy_test = compute_purity(0.5*(1+C_test),Cgt_test,nc) # 0.5*(1+C_test) in {0,1}

# Print
print('Linear SVM, iter, diff_alpha, acc :',str(k),str(diff_alpha)[:7],str(accuracy_test)[:5])

Linear SVM, iter, diff_alpha, acc : 4 0.0 83.5
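
For reference, here is a standard linear SVM on the raw features via scikit-learn. This is an aside and an assumption on my part, not the lab's construction: the cell above feeds the Euclidean distance matrix to the solver in place of a kernel, so the numbers need not match.

[ ]
# Optional aside (not part of the original lab): a plain linear SVM on the
# raw features. The lab's cell above instead uses the Euclidean distance
# matrix as the kernel, so accuracies need not agree.
from sklearn.svm import SVC
clf = SVC(kernel='linear', C=lamb)
clf.fit(Xtrain, l_train)
C_test_sk = clf.predict(Xtest)
acc_sk = compute_purity(0.5*(1+C_test_sk), Cgt_test, nc)
print('scikit-learn linear SVC acc:', str(acc_sk)[:5])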

Run kernel SVM

[9]
# Run kernel SVM

# Compute Gaussian kernel, L, Q
sigma = 0.5; sigma2 = sigma**2
Ddist = sklearn.metrics.pairwise.pairwise_distances(Xtrain, Xtrain, metric='euclidean', n_jobs=1)
Ker = np.exp(- Ddist**2 / sigma2)
Ddist = sklearn.metrics.pairwise.pairwise_distances(Xtrain, Xtest, metric='euclidean', n_jobs=1)
KXtest = np.exp(- Ddist**2 / sigma2)
l = l_train
L = np.diag(l)
Q = L.dot(Ker.dot(L))

# Time steps
tau_alpha = 10/ np.linalg.norm(Q,2)
tau_beta = 0.1/ np.linalg.norm(L,2)

# For conjugate gradient
Acg = tau_alpha* Q + np.eye(n)

# Pre-compute L.K(Xtest) for test data
LKXtest = L.dot(KXtest)

# Error parameter
lamb = 3 # acc: 87.5

# Initialization
alpha = np.zeros([n])
beta = 0.0
alpha_old = alpha

# Loop
k = 0
diff_alpha = 1e6
num_iter = 201
while (diff_alpha>1e-3) & (k<num_iter):

    # Update iteration
    k += 1

    # Update alpha
    # Approximate solution with conjugate gradient
    b0 = alpha + tau_alpha - tau_alpha* l* beta
    alpha, _ = scipy.sparse.linalg.cg(Acg, b0, x0=alpha, tol=1e-3, maxiter=50)
    alpha[alpha<0.0] = 0 # Projection on [0,+infty]
    alpha[alpha>lamb] = lamb # Projection on [-infty,lamb]

    # Update beta
    beta = beta + tau_beta* l.T.dot(alpha)

    # Stopping condition
    diff_alpha = np.linalg.norm(alpha-alpha_old)
    alpha_old = alpha

    # Evaluate every 10 iterations and at convergence
    if not(k%10) or (diff_alpha<1e-3):

        # Indicator function of support vectors
        idx = np.where( np.abs(alpha)>0.25* np.max(np.abs(alpha)) )
        Isv = np.zeros([n]); Isv[idx] = 1
        nb_sv = len(Isv.nonzero()[0])

        # Offset
        if nb_sv > 1:
            b = (Isv.T).dot( l - Ker.dot(L.dot(alpha)) )/ nb_sv
        else:
            b = 0

        # Continuous score function
        f_test = alpha.T.dot(LKXtest) + b

        # Binary classification function
        C_test = np.sign(f_test) # decision function in {-1,1}
        accuracy_test = compute_purity(0.5*(1+C_test),Cgt_test,nc) # 0.5*(1+C_test) in {0,1}

# Print
print('Kernel SVM  iter, diff_alpha :',str(k),str(diff_alpha)[:7])
print('            acc :',str(accuracy_test)[:5])

Kernel SVM  iter, diff_alpha : 100 0.00099
            acc : 87.5
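
On this dataset the Gaussian-kernel SVM reaches 87.5% accuracy versus 83.5% for the linear run above, echoing the two-moons experiment: a non-linear kernel helps when the classes are not linearly separable.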