X-Git-Url: http://gitweb.michael.orlitzky.com/?p=octave.git;a=blobdiff_plain;f=optimization%2Fpreconditioned_conjugate_gradient_method.m;h=e2f841aefea06ec92e8bb1e8dbe85eb5f2b65747;hp=63943482c8c6dd1b47d916d9bdaf400521d6b992;hb=92116b34e755b3ef5de14a1777676bc09180f007;hpb=84b8fb9002d091f84d0205e923c3989d0138ec9e diff --git a/optimization/preconditioned_conjugate_gradient_method.m b/optimization/preconditioned_conjugate_gradient_method.m index 6394348..e2f841a 100644 --- a/optimization/preconditioned_conjugate_gradient_method.m +++ b/optimization/preconditioned_conjugate_gradient_method.m @@ -1,8 +1,8 @@ -function [x, k] = preconditioned_conjugate_gradient_method(Q, - M, - b, - x0, - tolerance, +function [x, k] = preconditioned_conjugate_gradient_method(Q, ... + M, ... + b, ... + x0, ... + tolerance, ... max_iterations) % % Solve, @@ -39,7 +39,7 @@ function [x, k] = preconditioned_conjugate_gradient_method(Q, % % OUTPUT: % - % - ``x`` - The solution to Qx=b. + % - ``x`` - The computed solution to Qx=b. % % - ``k`` - The ending value of k; that is, the number of % iterations that were performed. @@ -52,14 +52,25 @@ function [x, k] = preconditioned_conjugate_gradient_method(Q, % Conjugate-Gradient Method", we are supposed to define % d_{0} = -z_{0}, not -r_{0} as written. % + % The rather verbose name of this function was chosen to avoid + % conflicts with other implementations. + % % REFERENCES: % % 1. Guler, Osman. Foundations of Optimization. New York, Springer, - % 2010. + % 2010. + % + % 2. Shewchuk, Jonathan Richard. An Introduction to the Conjugate + % Gradient Method Without the Agonizing Pain, Edition 1.25. + % August 4, 1994. % + % We use this in the inner loop. + n = length(x0); + sqrt_n = floor(sqrt(n)); + % Set k=0 first, that way the references to xk,rk,zk,dk which - % immediately follow correspond to x0,r0,z0,d0 respectively. + % immediately follow correspond (semantically) to x0,r0,z0,d0. k = 0; xk = x0; @@ -67,12 +78,7 @@ function [x, k] = preconditioned_conjugate_gradient_method(Q, zk = M \ rk; dk = -zk; - for k = [ 0 : max_iterations ] - if (norm(rk) < tolerance) - x = xk; - return; - end - + while (k <= max_iterations && norm(rk, 'inf') > tolerance) % Used twice, avoid recomputation. rkzk = rk' * zk; @@ -80,13 +86,36 @@ function [x, k] = preconditioned_conjugate_gradient_method(Q, % do them both, so we precompute the more expensive operation. Qdk = Q * dk; - alpha_k = rkzk/(dk' * Qdk); + % We're going to divide by this quantity... + dkQdk = dk' * Qdk; + + % So if it's too close to zero, we replace it with something + % comparable but non-zero. + if (dkQdk < eps) + dkQdk = eps; + end + + alpha_k = rkzk/dkQdk; x_next = xk + (alpha_k * dk); - r_next = rk + (alpha_k * Qdk); + + % The recursive definition of r_next is prone to accumulate + % roundoff error. When sqrt(n) divides k, we recompute the + % residual to minimize this error. This modification was suggested + % by the second reference. + if (mod(k, sqrt_n) == 0) + r_next = Q*x_next - b; + else + r_next = rk + (alpha_k * Qdk); + end + z_next = M \ r_next; beta_next = (r_next' * z_next)/rkzk; d_next = -z_next + beta_next*dk; + % We potentially just performed one more iteration than necessary + % in order to simplify the loop. Note that due to the structure of + % our loop, we will have k > max_iterations when we fail to + % converge. k = k + 1; xk = x_next; rk = r_next; @@ -94,5 +123,6 @@ function [x, k] = preconditioned_conjugate_gradient_method(Q, dk = d_next; end + % If we make it here, one of the two stopping conditions was met. x = xk; end