src/optimization/BFGS.cpp

/* -*- mode: c++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */

 /*
 Copyright (C) 2009 Frédéric Degraeve

 This file is part of QuantLib, a free-software/open-source library
 for financial quantitative analysts and developers - http://quantlib.org/

 QuantLib is free software: you can redistribute it and/or modify it
 under the terms of the QuantLib license.  You should have received a
 copy of the license along with this program; if not, please email
 <quantlib-dev@lists.sf.net>. The license is also available online at
 <http://quantlib.org/license.shtml>.

 This program is distributed in the hope that it will be useful, but WITHOUT
 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 FOR A PARTICULAR PURPOSE.  See the license for more details.
*/

#include "optimization/BFGS.hpp"
#include "optimization/Problem.hpp"
#include "optimization/LineSearch.hpp"

namespace QuantLib {

    DynamicVector<RealType> BFGS::getUpdatedDirection(const Problem& P,
                                                      RealType,
                                                      const DynamicVector<RealType>& oldGradient) {
        if (inverseHessian_.getNRow() == 0)
        {
            // first time in this update, we create needed structures
            inverseHessian_ = DynamicRectMatrix<RealType>(P.currentValue().size(),
                                                          P.currentValue().size(), 0.);
            for (size_t i = 0; i < P.currentValue().size(); ++i)
                inverseHessian_(i,i) = 1.;
        }

        DynamicVector<RealType> diffGradient;
        DynamicVector<RealType> diffGradientWithHessianApplied(P.currentValue().size(), 0.);

        diffGradient = lineSearch_->lastGradient() - oldGradient;
        for (size_t i = 0; i < P.currentValue().size(); ++i)
            for (size_t j = 0; j < P.currentValue().size(); ++j)
                diffGradientWithHessianApplied[i] += inverseHessian_(i,j) * diffGradient[j];

        double fac, fae, fad;
        double sumdg, sumxi;

        fac = fae = sumdg = sumxi = 0.;
        for (size_t i = 0; i < P.currentValue().size(); ++i)
        {
            fac += diffGradient[i] * lineSearch_->searchDirection()[i];
            fae += diffGradient[i] * diffGradientWithHessianApplied[i];
            sumdg += std::pow(diffGradient[i], 2.);
            sumxi += std::pow(lineSearch_->searchDirection()[i], 2.);
        }

        if (fac > std::sqrt(1e-8 * sumdg * sumxi))  // skip update if fac not sufficiently positive
        {
            fac = 1.0 / fac;
            fad = 1.0 / fae;
 
            for (size_t i = 0; i < P.currentValue().size(); ++i)
                diffGradient[i] = fac * lineSearch_->searchDirection()[i] - fad * diffGradientWithHessianApplied[i];

            for (size_t i = 0; i < P.currentValue().size(); ++i)
                for (size_t j = 0; j < P.currentValue().size(); ++j)
                {
                    inverseHessian_(i,j) += fac * lineSearch_->searchDirection()[i] * lineSearch_->searchDirection()[j];
                    inverseHessian_(i,j) -= fad * diffGradientWithHessianApplied[i] * diffGradientWithHessianApplied[j];
                    inverseHessian_(i,j) += fae * diffGradient[i] * diffGradient[j];
                }
        }
        //else
        //  throw "BFGS: FAC not sufficiently positive";


        DynamicVector<RealType> direction(P.currentValue().size());
        for (size_t i = 0; i < P.currentValue().size(); ++i)
        {
            direction[i] = 0.0;
            for (size_t j = 0; j < P.currentValue().size(); ++j)
                direction[i] -= inverseHessian_(i,j) * lineSearch_->lastGradient()[j];
        }

        return direction;
    }

}
Revision:	1782
Committed:	Wed Aug 22 02:28:28 2012 UTC (13 years, 2 months ago) by gezelter
File size:	3763 byte(s)
Log Message:	MERGE OpenMD development branch 1465:1781 into trunk
#	User	Rev	Content
1	gezelter	1741	/* -- mode: c++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -- */
2
3			/*
4			Copyright (C) 2009 Frédéric Degraeve
5
6			This file is part of QuantLib, a free-software/open-source library
7			for financial quantitative analysts and developers - http://quantlib.org/
8
9			QuantLib is free software: you can redistribute it and/or modify it
10			under the terms of the QuantLib license. You should have received a
11			copy of the license along with this program; if not, please email
12			<quantlib-dev@lists.sf.net>. The license is also available online at
13			<http://quantlib.org/license.shtml>.
14
15			This program is distributed in the hope that it will be useful, but WITHOUT
16			ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
17			FOR A PARTICULAR PURPOSE. See the license for more details.
18			*/
19
20			#include "optimization/BFGS.hpp"
21			#include "optimization/Problem.hpp"
22			#include "optimization/LineSearch.hpp"
23
24			namespace QuantLib {
25
26			DynamicVector<RealType> BFGS::getUpdatedDirection(const Problem& P,
27			RealType,
28			const DynamicVector<RealType>& oldGradient) {
29			if (inverseHessian_.getNRow() == 0)
30			{
31			// first time in this update, we create needed structures
32			inverseHessian_ = DynamicRectMatrix<RealType>(P.currentValue().size(),
33			P.currentValue().size(), 0.);
34			for (size_t i = 0; i < P.currentValue().size(); ++i)
35			inverseHessian_(i,i) = 1.;
36			}
37
38			DynamicVector<RealType> diffGradient;
39			DynamicVector<RealType> diffGradientWithHessianApplied(P.currentValue().size(), 0.);
40
41			diffGradient = lineSearch_->lastGradient() - oldGradient;
42			for (size_t i = 0; i < P.currentValue().size(); ++i)
43			for (size_t j = 0; j < P.currentValue().size(); ++j)
44			diffGradientWithHessianApplied[i] += inverseHessian_(i,j) * diffGradient[j];
45
46			double fac, fae, fad;
47			double sumdg, sumxi;
48
49			fac = fae = sumdg = sumxi = 0.;
50			for (size_t i = 0; i < P.currentValue().size(); ++i)
51			{
52			fac += diffGradient[i] * lineSearch_->searchDirection()[i];
53			fae += diffGradient[i] * diffGradientWithHessianApplied[i];
54			sumdg += std::pow(diffGradient[i], 2.);
55			sumxi += std::pow(lineSearch_->searchDirection()[i], 2.);
56			}
57
58			if (fac > std::sqrt(1e-8 * sumdg * sumxi)) // skip update if fac not sufficiently positive
59			{
60			fac = 1.0 / fac;
61			fad = 1.0 / fae;
62
63			for (size_t i = 0; i < P.currentValue().size(); ++i)
64			diffGradient[i] = fac * lineSearch_->searchDirection()[i] - fad * diffGradientWithHessianApplied[i];
65
66			for (size_t i = 0; i < P.currentValue().size(); ++i)
67			for (size_t j = 0; j < P.currentValue().size(); ++j)
68			{
69			inverseHessian_(i,j) += fac * lineSearch_->searchDirection()[i] * lineSearch_->searchDirection()[j];
70			inverseHessian_(i,j) -= fad * diffGradientWithHessianApplied[i] * diffGradientWithHessianApplied[j];
71			inverseHessian_(i,j) += fae * diffGradient[i] * diffGradient[j];
72			}
73			}
74			//else
75			// throw "BFGS: FAC not sufficiently positive";
76
77
78			DynamicVector<RealType> direction(P.currentValue().size());
79			for (size_t i = 0; i < P.currentValue().size(); ++i)
80			{
81			direction[i] = 0.0;
82			for (size_t j = 0; j < P.currentValue().size(); ++j)
83			direction[i] -= inverseHessian_(i,j) * lineSearch_->lastGradient()[j];
84			}
85
86			return direction;
87			}
88
89			}