| 1 | //
 | 
|---|
| 2 | // dfp.cc
 | 
|---|
| 3 | //
 | 
|---|
| 4 | // Copyright (C) 1996 Limit Point Systems, Inc.
 | 
|---|
| 5 | //
 | 
|---|
| 6 | // Author: Edward Seidl <seidl@janed.com>
 | 
|---|
| 7 | // Maintainer: LPS
 | 
|---|
| 8 | //
 | 
|---|
| 9 | // This file is part of the SC Toolkit.
 | 
|---|
| 10 | //
 | 
|---|
| 11 | // The SC Toolkit is free software; you can redistribute it and/or modify
 | 
|---|
| 12 | // it under the terms of the GNU Library General Public License as published by
 | 
|---|
| 13 | // the Free Software Foundation; either version 2, or (at your option)
 | 
|---|
| 14 | // any later version.
 | 
|---|
| 15 | //
 | 
|---|
| 16 | // The SC Toolkit is distributed in the hope that it will be useful,
 | 
|---|
| 17 | // but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
|---|
| 18 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
|---|
| 19 | // GNU Library General Public License for more details.
 | 
|---|
| 20 | //
 | 
|---|
| 21 | // You should have received a copy of the GNU Library General Public License
 | 
|---|
| 22 | // along with the SC Toolkit; see the file COPYING.LIB.  If not, write to
 | 
|---|
| 23 | // the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
 | 
|---|
| 24 | //
 | 
|---|
| 25 | // The U.S. Government is granted a limited license as per AL 91-7.
 | 
|---|
| 26 | //
 | 
|---|
| 27 | 
 | 
|---|
| 28 | #include <math.h>
 | 
|---|
| 29 | 
 | 
|---|
| 30 | #include <util/state/stateio.h>
 | 
|---|
| 31 | #include <math/optimize/update.h>
 | 
|---|
| 32 | #include <math/optimize/transform.h>
 | 
|---|
| 33 | #include <util/keyval/keyval.h>
 | 
|---|
| 34 | 
 | 
|---|
| 35 | using namespace sc;
 | 
|---|
| 36 | 
 | 
|---|
| 37 | /////////////////////////////////////////////////////////////////////////
 | 
|---|
| 38 | // DFPUpdate
 | 
|---|
| 39 | 
 | 
|---|
| 40 | static ClassDesc DFPUpdate_cd(
 | 
|---|
| 41 |   typeid(DFPUpdate),"DFPUpdate",1,"public HessianUpdate",
 | 
|---|
| 42 |   create<DFPUpdate>, create<DFPUpdate>, create<DFPUpdate>);
 | 
|---|
| 43 | 
 | 
|---|
| 44 | DFPUpdate::DFPUpdate()
 | 
|---|
| 45 | {
 | 
|---|
| 46 | }
 | 
|---|
| 47 | 
 | 
|---|
| 48 | DFPUpdate::DFPUpdate(const Ref<KeyVal>&keyval):
 | 
|---|
| 49 |   HessianUpdate(keyval)
 | 
|---|
| 50 | {
 | 
|---|
| 51 |   if (keyval->exists("xprev") && keyval->exists("gprev")) {
 | 
|---|
| 52 |     Ref<SCMatrixKit> k = SCMatrixKit::default_matrixkit();
 | 
|---|
| 53 |     RefSCDimension dim = new SCDimension(keyval->count("xprev"));
 | 
|---|
| 54 |     xprev = k->vector(dim);
 | 
|---|
| 55 |     gprev = k->vector(dim);
 | 
|---|
| 56 |     for (int i=0; i<dim.n(); i++) {
 | 
|---|
| 57 |       xprev(i) = keyval->doublevalue("xprev",i);
 | 
|---|
| 58 |       gprev(i) = keyval->doublevalue("gprev",i);
 | 
|---|
| 59 |     }
 | 
|---|
| 60 |   }
 | 
|---|
| 61 | }
 | 
|---|
| 62 | 
 | 
|---|
| 63 | DFPUpdate::DFPUpdate(StateIn&s):
 | 
|---|
| 64 |   SavableState(s),
 | 
|---|
| 65 |   HessianUpdate(s)
 | 
|---|
| 66 | {
 | 
|---|
| 67 |   Ref<SCMatrixKit> k = SCMatrixKit::default_matrixkit();
 | 
|---|
| 68 |   RefSCDimension dim;
 | 
|---|
| 69 |   dim << SavableState::restore_state(s);
 | 
|---|
| 70 |   xprev = k->vector(dim);
 | 
|---|
| 71 |   gprev = k->vector(dim);
 | 
|---|
| 72 |   xprev.restore(s);
 | 
|---|
| 73 |   gprev.restore(s);
 | 
|---|
| 74 | }
 | 
|---|
| 75 | 
 | 
|---|
| 76 | DFPUpdate::~DFPUpdate()
 | 
|---|
| 77 | {
 | 
|---|
| 78 | }
 | 
|---|
| 79 | 
 | 
|---|
| 80 | void
 | 
|---|
| 81 | DFPUpdate::save_data_state(StateOut&s)
 | 
|---|
| 82 | {
 | 
|---|
| 83 |   HessianUpdate::save_data_state(s);
 | 
|---|
| 84 |   SavableState::save_state(xprev.dim().pointer(),s);
 | 
|---|
| 85 |   xprev.save(s);
 | 
|---|
| 86 |   gprev.save(s);
 | 
|---|
| 87 | }
 | 
|---|
| 88 | 
 | 
|---|
| 89 | void
 | 
|---|
| 90 | DFPUpdate::update(const RefSymmSCMatrix&ihessian,const Ref<Function>&func,
 | 
|---|
| 91 |                   const RefSCVector&xn,const RefSCVector&gn)
 | 
|---|
| 92 | {
 | 
|---|
| 93 |   RefSCVector xnew, gnew;
 | 
|---|
| 94 | 
 | 
|---|
| 95 |   // the update for the inverse hessian differs from the update for the
 | 
|---|
| 96 |   // hessian in that xdisp and gdisp are exchanged
 | 
|---|
| 97 |   if (inverse_hessian_) {
 | 
|---|
| 98 |     xnew = xn;
 | 
|---|
| 99 |     gnew = gn;
 | 
|---|
| 100 |   } else {
 | 
|---|
| 101 |     xnew = gn;
 | 
|---|
| 102 |     gnew = xn;
 | 
|---|
| 103 |   }
 | 
|---|
| 104 |   
 | 
|---|
| 105 |   if (xprev.nonnull()) {
 | 
|---|
| 106 |     RefSCVector xdisp = xnew-xprev;
 | 
|---|
| 107 |     RefSCVector gdisp = gnew-gprev;
 | 
|---|
| 108 |     RefSCVector ihessian_gdisp = ihessian * gdisp;
 | 
|---|
| 109 |     double gdisp_ihessian_gdisp = ihessian_gdisp.scalar_product(gdisp);
 | 
|---|
| 110 |     double xdisp_gdisp = xdisp.scalar_product(gdisp);
 | 
|---|
| 111 |     ihessian.accumulate(
 | 
|---|
| 112 |         xdisp.symmetric_outer_product()*(1.0/xdisp_gdisp)
 | 
|---|
| 113 |         - ihessian_gdisp.symmetric_outer_product()*(1.0/gdisp_ihessian_gdisp)
 | 
|---|
| 114 |       );
 | 
|---|
| 115 |     xprev.assign(xnew);
 | 
|---|
| 116 |     gprev.assign(gnew);
 | 
|---|
| 117 |   } else {
 | 
|---|
| 118 |     xprev = xnew.copy();
 | 
|---|
| 119 |     gprev = gnew.copy();
 | 
|---|
| 120 |   }
 | 
|---|
| 121 | }
 | 
|---|
| 122 | 
 | 
|---|
| 123 | void
 | 
|---|
| 124 | DFPUpdate::apply_transform(const Ref<NonlinearTransform>& trans)
 | 
|---|
| 125 | {
 | 
|---|
| 126 |   if (trans.null()) return;
 | 
|---|
| 127 |   HessianUpdate::apply_transform(trans);
 | 
|---|
| 128 |   trans->transform_coordinates(xprev);
 | 
|---|
| 129 |   trans->transform_gradient(gprev);
 | 
|---|
| 130 | }
 | 
|---|
| 131 | 
 | 
|---|
| 132 | void
 | 
|---|
| 133 | DFPUpdate::set_inverse(void)
 | 
|---|
| 134 | {
 | 
|---|
| 135 |   HessianUpdate::set_inverse();
 | 
|---|
| 136 |   RefSCVector tmp;
 | 
|---|
| 137 |   tmp = xprev;
 | 
|---|
| 138 |   xprev = gprev;
 | 
|---|
| 139 |   gprev = tmp;
 | 
|---|
| 140 | }
 | 
|---|
| 141 | 
 | 
|---|
| 142 | /////////////////////////////////////////////////////////////////////////
 | 
|---|
| 143 | // BFGSUpdate
 | 
|---|
| 144 | 
 | 
|---|
| 145 | static ClassDesc BFGSUpdate_cd(
 | 
|---|
| 146 |   typeid(BFGSUpdate),"BFGSUpdate",1,"public HessianUpdate",
 | 
|---|
| 147 |   create<BFGSUpdate>, create<BFGSUpdate>, create<BFGSUpdate>);
 | 
|---|
| 148 | 
 | 
|---|
| 149 | BFGSUpdate::BFGSUpdate()
 | 
|---|
| 150 | {
 | 
|---|
| 151 | }
 | 
|---|
| 152 | 
 | 
|---|
| 153 | BFGSUpdate::BFGSUpdate(const Ref<KeyVal>&keyval):
 | 
|---|
| 154 |   DFPUpdate(keyval)
 | 
|---|
| 155 | {
 | 
|---|
| 156 | }
 | 
|---|
| 157 | 
 | 
|---|
| 158 | BFGSUpdate::BFGSUpdate(StateIn&s):
 | 
|---|
| 159 |   SavableState(s),
 | 
|---|
| 160 |   DFPUpdate(s)
 | 
|---|
| 161 | {
 | 
|---|
| 162 | }
 | 
|---|
| 163 | 
 | 
|---|
| 164 | BFGSUpdate::~BFGSUpdate()
 | 
|---|
| 165 | {
 | 
|---|
| 166 | }
 | 
|---|
| 167 | 
 | 
|---|
| 168 | void
 | 
|---|
| 169 | BFGSUpdate::save_data_state(StateOut&s)
 | 
|---|
| 170 | {
 | 
|---|
| 171 |   DFPUpdate::save_data_state(s);
 | 
|---|
| 172 | }
 | 
|---|
| 173 | 
 | 
|---|
| 174 | void
 | 
|---|
| 175 | BFGSUpdate::update(const RefSymmSCMatrix&ihessian,const Ref<Function>&func,
 | 
|---|
| 176 |                    const RefSCVector&xn,const RefSCVector&gn)
 | 
|---|
| 177 | {
 | 
|---|
| 178 |   RefSCVector xnew, gnew;
 | 
|---|
| 179 | 
 | 
|---|
| 180 |   // the update for the inverse hessian differs from the update for the
 | 
|---|
| 181 |   // hessian in that xdisp and gdisp are exchanged
 | 
|---|
| 182 |   if (inverse_hessian_) {
 | 
|---|
| 183 |     xnew = xn;
 | 
|---|
| 184 |     gnew = gn;
 | 
|---|
| 185 |   } else {
 | 
|---|
| 186 |     xnew = gn;
 | 
|---|
| 187 |     gnew = xn;
 | 
|---|
| 188 |   }
 | 
|---|
| 189 |   
 | 
|---|
| 190 |   if (xprev.nonnull()) {
 | 
|---|
| 191 |     RefSCVector xdisp = xnew-xprev;
 | 
|---|
| 192 |     RefSCVector gdisp = gnew-gprev;
 | 
|---|
| 193 |     RefSCVector ihessian_gdisp = ihessian * gdisp;
 | 
|---|
| 194 |     double gdisp_ihessian_gdisp = ihessian_gdisp.scalar_product(gdisp);
 | 
|---|
| 195 |     double xdisp_gdisp = xdisp.scalar_product(gdisp);
 | 
|---|
| 196 |     RefSCVector u =   xdisp*(1.0/xdisp_gdisp)
 | 
|---|
| 197 |                       - ihessian_gdisp*(1.0/gdisp_ihessian_gdisp);
 | 
|---|
| 198 |     ihessian.accumulate(
 | 
|---|
| 199 |         // DFP part
 | 
|---|
| 200 |         xdisp.symmetric_outer_product()*(1.0/xdisp_gdisp)
 | 
|---|
| 201 |         - ihessian_gdisp.symmetric_outer_product()*(1.0/gdisp_ihessian_gdisp)
 | 
|---|
| 202 |         // BFGS part
 | 
|---|
| 203 |         + u.symmetric_outer_product() * gdisp_ihessian_gdisp
 | 
|---|
| 204 |       );
 | 
|---|
| 205 |     xprev.assign(xnew);
 | 
|---|
| 206 |     gprev.assign(gnew);
 | 
|---|
| 207 |   } else {
 | 
|---|
| 208 |     xprev = xnew.copy();
 | 
|---|
| 209 |     gprev = gnew.copy();
 | 
|---|
| 210 |   }
 | 
|---|
| 211 | }
 | 
|---|
| 212 | 
 | 
|---|
| 213 | /////////////////////////////////////////////////////////////////////////////
 | 
|---|
| 214 | 
 | 
|---|
| 215 | // Local Variables:
 | 
|---|
| 216 | // mode: c++
 | 
|---|
| 217 | // c-file-style: "ETS"
 | 
|---|
| 218 | // End:
 | 
|---|