forked from tourmaline612/FSVM
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathFSVM_train_update_St.m
70 lines (61 loc) · 1.98 KB
/
FSVM_train_update_St.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
function [ model, L ] = FSVM_train_update_St(Ytrain, trainset, option, opts, rho)
% By using the St (the total scatter matrix), updating St
% trainset: nxd
%
% parameter settings
epsilon = opts.epsilon;
threshold = opts.threshold;
maxiter = opts.maxiter;
alpha = opts.alpha;
coef = opts.coef;
% calculate the total scatter matrix
S = cov( trainset, 1 ); % equal to cov( trainset ) * (size(trainset,1)-1)/size(trainset,1);
[ U, E ] = eig( full(S) );
[ dummy, order ] = sort( diag(E), 'descend' );
U = U( : , order );
% Semi-Whiten process
dummy = dummy + epsilon;
Sigma = diag((dummy*rho).^(-alpha));
M = U * Sigma * U'; %M=L'L
L = Sigma.^(alpha)*U';
stop = 1; iter = 1; t = 0.1; beta = 0.9;
% initialize the (w,b)
model = svmtrain( Ytrain, trainset, option);
w = calc_w(model);
rho_ = rho/norm(w);
w = normalizemeanstd(w);
% alternatively update w and M
while stop > threshold && iter <= maxiter
% update M with (w,b)
A = w * w' + epsilon * eye(size(w,1));
gradient = - 0.5 * inv(M) * A * inv(M) + rho_ * S;
M_tmp = M - t * gradient;
M_tmp = M_tmp + epsilon*eye(size(M_tmp,1));
[U_tmp, E_tmp] = eig(M_tmp);
[ dummy_M, order_M ] = sort( diag(E_tmp), 'descend' );
U_tmp = U_tmp( : , order_M );
Sigma_tmp = diag(dummy_M);
U_tmp = U_tmp( : , [1:numel(dummy_M)] );
M_update = U_tmp*Sigma_tmp*U_tmp';
M = M_update;
% update (w,b) with M and input Ztrain:kxn
L = Sigma_tmp*U';
Ztrain = trainset*L';
model = svmtrain( Ytrain, Ztrain, option);
v = calc_w(model);
w = L' * v;
rho_ = rho/norm(w);
w = bsxfun(@rdivide, w, sqrt(sum(w.^2,1)));
% the objective
obj = -sum(model.obj) + rho_ * trace(S * M_update);
% the stop criteria
if iter > 1
stop = obj_previous - obj;
end
% update the total scatter matrix
S = update_St(coef, trainset, Ztrain);
t = beta * t;
obj_previous = obj;
iter = iter+1;
end
end