-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathGLRT.m
150 lines (113 loc) · 4.74 KB
/
GLRT.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
function [ s, stat ] = GLRT(grad_f, hess_f, sigma, varargin)
% Lanczos Type Method for finding the global minimum of the regularised
% local quadratic model m(s) in a subspace S_j
%
% Input -
% f: objective function
% CurrentX: current iterate
% grad_f: current gradient
% hess_f: current hessian
%
% Optional Input -
% theta: algorithm parameter
% sigma0: initial regularisation
% outputLevel: 0, 1 or 2
%
% Output -
% s, global minimiser over a subspace
% stat: algortihm exit status
%% Process the Input
if nargin == 3
% use standart settings
theta = 1e-4; outputLevel = 2;
else
options = varargin{1};
[theta, outputLevel] = GLRT_Input(options);
end
%% Initialise
j = 1; % Loop counter
n = length(grad_f); % problem dimension
gamma0 = norm(grad_f);
Lanczos_Tol = 1e-10;
Lanczos_Options = struct('Lanczos_Tol', Lanczos_Tol);
Newton_Options = struct('Epsilon_Newton', 1e-6, 'IterMax_Newton', n*20, 'OutputLevel', outputLevel);
% Initialise the Algortihm
q_old_old = 0; q_old = grad_f/gamma0; beta_old = 0;
[ alpha, beta_new, q_new ] = Lanczos_Algorithm( q_old, q_old_old, hess_f, beta_old);
V = [q_old, q_new]; T = [alpha; beta_new];
% Compute the first multiplier
lambda = - alpha/2 + sqrt( (alpha/2)^2 + sigma*gamma0);
u = - lambda/sigma;
% Define a function. Shall accept row vectors as input
% m = @(s) s*grad_f + 1/2*s*hess_f*s' + 1/3*sigma*norm(s)^3;
% grad_m = @(s) (hess_f + sigma*norm(s) * eye(n))*s + grad_f;
%% Give out information
if outputLevel > 0
fprintf('\n \t \t GLRT: sigma = %1.2f. \n ', sigma);
fprintf( [ ' \n \t \t iter lambda ', ...
' beta_k * |u_k^(k)| theta*||u||^2 \t ||u|| \n' ] );
fprintf( ' \t \t %6.0f %13.3e \t %12.3e \t \t \t %8.3e \t \t %8.3e \n', ...
j, lambda, beta_new * abs(u(end)), theta*norm(u)^2, norm(u) );
end
%% Inner Loop over expanding subspaces
%while norm(gradM) > min([theta, sqrt(norm(grad_f))])*norm(grad_f) && j <= n
while beta_new * abs(u(end)) > theta*norm(u)^2 && j <= n
%% Create tridiagonal T and basis Q
j = j+1;
%[ Q, T ] = Lanczos( j, n, Q, T, CurrentX, hess_f);
% Move values around a little
q_old_old = q_old;
q_old = q_new;
beta_old = beta_new;
% Create new quantities
[ alpha, beta_new, q_new ] = Lanczos_Algorithm( q_old, q_old_old, hess_f, beta_old, Lanczos_Options);
% adjust the matrices
T = [[T; zeros(1, j-1)], [zeros(j-2, 1); beta_old; alpha; beta_new]];
% Check for a breakdown in the Lanczos algortihm
if beta_new < Lanczos_Tol
disp('there was a breakdown');
else
V = [V, q_new];
end
%% Solve for u in the current subspace
% We need to do an efficient cholesky factorisation and we need to
% estimate the smallest eigenvalue of T.
% Compute u by a Newton Type Method
[ u, lambda, phi ] = AdaptedNewton(n, T(1:j, 1:j), sigma, gamma0, Newton_Options) ;
% Does this u really minimise the local model over the current
% subspace?
% Create the identity
% if j ~= n
% I = eye(j+1);
% else
% I = eye(j);
% end
I = eye(j);
error = norm((T(1:j, 1:j) + lambda*I)*u + gamma0*I(:, 1));
% Also check positive semi definiteness:
smallestEV = eigs(T(1:j, 1:j) + lambda*I, 1, 'sa');
% Result: u does indeed minimise the local model globaly in the current
% subspace. Next, we can try to check whether the Matrices Q and T do
% as they should:
MatrixError = norm(V(:, 1:j)'*hess_f*V(:, 1:j) - T(1:j, 1:j));
%disp(MatrixError);
%% Update the model gradient and the loop counter
% gradM = grad_f + hess_f*s + lambda * s; % Gradient of the local model
%% Display information
if outputLevel > 0
fprintf( [ ' \n \t \t iter lambda ', ...
' beta_k * |u_k^(k)| theta*||u||^2 phi \t ||u|| \t \t Error \t \t smallestEV \t MatErr \n' ] );
fprintf( ' \t \t %6.0f %13.3e %12.3e \t \t \t \t %8.3e %8.3e \t %1.2e \t %1.4e \t %1.3f \t \t %1.3f \n', ...
j-1, lambda, beta_new * abs(u(end)), theta*norm(u)^2, phi, norm(u), error, smallestEV, MatrixError );
end
% We will stop the iteration as soon as we either drive the norm of the gradient under the
% relative stopping criterion or we hit the iteration limit n, which is the problem dimension
end
% Recover s from here:
s = V(:, 1:j)*u;
if j >= n && beta_new * abs(u(end)) > theta*norm(u)^2
stat = 0; % Failed to converge while trying to minimise the local model
else
stat = 1; % everything is fine
end
end