MADNESS 0.10.1
nonlinsol.h
Go to the documentation of this file.
1/*
2 This file is part of MADNESS.
3
4 Copyright (C) 2007,2010 Oak Ridge National Laboratory
5
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2 of the License, or
9 (at your option) any later version.
10
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19
20 For more information please contact:
21
22 Robert J. Harrison
23 Oak Ridge National Laboratory
24 One Bethel Valley Road
25 P.O. Box 2008, MS-6367
26
27 email: harrisonrj@ornl.gov
28 tel: 865-241-3937
29 fax: 865-572-0680
30
31 $Id$
32*/
33
34#ifndef MADNESS_EXAMPLES_NONLINSOL_H__INCLUDED
35#define MADNESS_EXAMPLES_NONLINSOL_H__INCLUDED
36
37/*!
38 \file nonlinsol.h
39 \brief Implementation of Krylov-subspace nonlinear equation solver
40 \defgroup nonlinearsolve Simple Krylov-subspace nonlinear equation solver
41 \ingroup mra
42
43 This class implements the solver described in
44 \verbatim
45 R. J. Harrison, Krylov subspace accelerated inexact newton method for linear
46 and nonlinear equations, J. Comput. Chem. 25 (2004), no. 3, 328-334.
47 \endverbatim
48 */
49
50#include <madness/mra/mra.h>
52
53namespace madness {
54
55
56 /// check for subspace linear dependency
57
58 /// @param[in] Q the input matrix for KAIN
59 /// @param[in,out] c the coefficients for constructing the new solution
60 /// @param[in] rcondtol rcond less than this will cause the subspace to be shrunk due to linear dependence
61 /// @param[in] cabsmax maximum element of c greater than this will cause the subspace to be shrunk due to linear dependence
62 template<typename C>
63 void check_linear_dependence(const Tensor<C>& Q, Tensor<C>& c, const double rcondtol, const double cabsmax,
64 bool do_print=true) {
65 double rcond = 1e-12;
66 int m = c.dim(0);
67
68 while(1){
69 c = KAIN(Q, rcond);
70 //if (world.rank() == 0) print("kain c:", c);
71// if(std::abs(c[m - 1]) < 3.0){
72 if (c.absmax()<cabsmax) {
73 break;
74 } else if(rcond < rcondtol){
75 if (do_print) print("Increasing subspace singular value threshold ", c[m - 1], rcond);
76 rcond *= 100;
77 } else {
78 if (do_print) print("Forcing full step due to subspace malfunction");
79 c = 0.0;
80 c[m - 1] = 1.0;
81 break;
82 }
83 }
84 }
85
86 /// A simple Krylov-subspace nonlinear equation solver
87
88 /// \ingroup nonlinearsolve
89 template<size_t NDIM>
91 unsigned int maxsub; ///< Maximum size of subspace dimension
92
93 std::vector<Function<double,NDIM> > ulist, rlist;
95
96 public:
97 void set_maxsub(const unsigned int &new_maxsub){
98 maxsub = new_maxsub;
99 }
100 unsigned int get_maxsub()const{
101 const unsigned int tmp = maxsub;
102 return tmp;
103 }
105
106 NonlinearSolverND(unsigned int maxsub = 10) : maxsub(maxsub), do_print(false) {}
107
108 /// Computes next trial solution vector
109
110 /// You are responsible for performing step restriction or line search
111 /// (not necessary for linear problems).
112 ///
113 /// @param u Current solution vector
114 /// @param r Corresponding residual
115 /// @return Next trial solution vector
116 /// @param[in] rcondtol rcond less than this will cause the subspace to be shrunk due to linear dependence
117 /// @param[in] cabsmax maximum element of c greater than this will cause the subspace to be shrunk due to linear dependence
119 const double rcondtol=1e-8, const double cabsmax=1000.0) {
120 if (maxsub==1) return u-r;
121 int iter = ulist.size();
122 ulist.push_back(u);
123 rlist.push_back(r);
124
125 // Solve subspace equations
126 real_tensor Qnew(iter+1,iter+1);
127 if (iter>0) Qnew(Slice(0,-2),Slice(0,-2)) = Q;
128 for (int i=0; i<=iter; i++) {
129 Qnew(i,iter) = inner(ulist[i],rlist[iter]);
130 Qnew(iter,i) = inner(ulist[iter],rlist[i]);
131 }
132 // ulist and rlist are now either compressed or redundant -- change back to compressed or reconstructed0
133 TreeState operating_state = u.get_impl()->get_tensor_type()==TT_FULL ? compressed : reconstructed;
134 change_tree_state(ulist,operating_state,true);
135 change_tree_state(rlist,operating_state,true);
136
137 Q = Qnew;
138 real_tensor c = KAIN(Q);
139 check_linear_dependence(Q,c,rcondtol,cabsmax);
140 if (do_print) print("subspace solution",c);
141
142 // Form new solution in u, gaxpy in done in reconstructed or compressed state
143 Function<double,NDIM> unew = FunctionFactory<double,NDIM>(u.world()).treestate(operating_state);
144 // if (ulist[0].is_compressed()) unew.compress();
145 for (int i=0; i<=iter; i++) {
146 unew.gaxpy(1.0,ulist[i], c[i]);
147 unew.gaxpy(1.0,rlist[i],-c[i]);
148 }
149 unew.truncate();
150
151 if (ulist.size() == maxsub) {
152 ulist.erase(ulist.begin());
153 rlist.erase(rlist.begin());
154 Q = copy(Q(Slice(1,-1),Slice(1,-1)));
155 }
156 return unew;
157 }
158 };
159
160 // backwards compatibility
162
163
164 template <class T>
166 T operator()() {return T();}
167 };
168
169
170 // The default constructor for functions does not initialize
171 // them to any value, but the solver needs functions initialized
172 // to zero for which we also need the world object.
173 template<typename T, std::size_t NDIM>
176 const int n=-1;
177
178 /// @param[in] world the world
179 /// @param[in] nn the number of functions in a given vector
181
182 /// allocate a vector of n empty functions
183 std::vector<Function<T, NDIM> > operator()() {
184 return zero_functions<T, NDIM>(world, n);
185 }
186 };
187
188
189
190 /// Generalized version of NonlinearSolver not limited to a single madness function
191
192 /// \ingroup nonlinearsolve
193 ///
194 /// This solves the equation \f$r(u) = 0\f$ where u and r are both
195 /// of type \c T and inner products between two items of type \c T
196 /// produce a number of type \c C (defaulting to double). The type \c T
197 /// must support storage in an STL vector, scaling by a constant
198 /// of type \c C, inplace addition (+=), subtraction, allocation with
199 /// value zero, and inner products computed with the interface \c
200 /// inner(a,b). Have a look in examples/testsolver.cc for a
201 /// simple but complete example, and in examples/h2dynamic.cc for a
202 /// more complex example.
203 ///
204 /// I've not yet tested with anything except \c C=double and I think
205 /// that the KAIN routine will need extending for anything else.
206 template <class T, class C = double, class Alloc = default_allocator<T> >
208 unsigned int maxsub; ///< Maximum size of subspace dimension
209 Alloc alloc;
210 std::vector<T> ulist, rlist, plist; ///< Subspace information
212 Tensor<C> c; ///< coefficients for linear combination
213 public:
215
216 XNonlinearSolver(const Alloc& alloc = Alloc(),bool print=false)
217 : maxsub(10)
218 , alloc(alloc)
219 , do_print(print)
220 {}
221
223 : maxsub(other.maxsub)
224 , alloc(other.alloc)
225 , do_print(other.do_print)
226 {}
227
228
229 std::vector<T>& get_ulist() {return ulist;}
230 std::vector<T>& get_rlist() {return rlist;}
231 std::vector<T>& get_plist() {return plist;}
232
233 void set_maxsub(int maxsub) {this->maxsub = maxsub;}
234 Tensor<C> get_c() const {return c;}
235
237 ulist.clear();
238 rlist.clear();
239 plist.clear();
240 Q=Tensor<C>();
241 }
242
243 /// Computes next trial solution vector
244
245 /// You are responsible for performing step restriction or line search
246 /// (not necessary for linear problems).
247 ///
248 /// @param u Current solution vector
249 /// @param r Corresponding residual
250 /// @return Next trial solution vector
251 /// @param[in] rcondtol rcond less than this will cause the subspace to be shrunk due to linear dependence
252 /// @param[in] cabsmax maximum element of c greater than this will cause the subspace to be shrunk due to li
253 T update(const T& u, const T& r, const double rcondtol=1e-8, const double cabsmax=1000.0) {
254 if (maxsub==1) return u-r;
255 int iter = ulist.size();
256 ulist.push_back(u);
257 rlist.push_back(r);
258
259 // Solve subspace equations
260 Tensor<C> Qnew(iter+1,iter+1);
261 if (iter>0) Qnew(Slice(0,-2),Slice(0,-2)) = Q;
262 for (int i=0; i<=iter; i++) {
263 Qnew(i,iter) = inner(ulist[i],rlist[iter]);
264 Qnew(iter,i) = inner(ulist[iter],rlist[i]);
265 }
266 Q = Qnew;
267 c = KAIN(Q);
268
269 check_linear_dependence(Q,c,rcondtol,cabsmax,do_print);
270 if (do_print) print("subspace solution",c);
271
272 // Form new solution in u
273 T unew = alloc();
274 for (int i=0; i<=iter; i++) {
275 unew += (ulist[i] - rlist[i])*c[i];
276 }
277
278 if (ulist.size() == maxsub) {
279 ulist.erase(ulist.begin());
280 rlist.erase(rlist.begin());
281 Q = copy(Q(Slice(1,-1),Slice(1,-1)));
282 }
283 return unew;
284 }
285
286 /// Computes next trial solution vector
287
288 /// this version of update avoids using the residual by computing it on the fly
289 /// note the distinction between u_preliminary (input) and u_kain (output)
290 /// residual[i] = u_kain[i] - u_preliminary[i+1]
291 /// ulist[i] = u_kain[i]
292 /// plist[i] = u_preliminary[i]
293 /// @param[in] u_preliminary: new solution before KAIN
294 /// @param[out] u_kain: new solution after KAIN
295 T update(const T& u_preliminary, const double rcondtol=1e-8, const double cabsmax=1000.0) {
296 if (maxsub==1) return u_preliminary;
297
298 // check if T is a madness function or madness function vector, then we need to know the tree state
300
301 // works for both Function and FunctionVector
302 auto get_operating_state = [](const T& v) {
303 TreeState state=unknown;
304 if constexpr (is_madness_function<T>::value) {
305 state=v.get_impl()->get_tensor_type()==TT_FULL ? compressed : reconstructed;
306 } else if constexpr (is_madness_function_vector<T>::value) {
307 state=v[0].get_impl()->get_tensor_type()==TT_FULL ? compressed : reconstructed;
308 }
309 return state;
310 };
311
312 // do we work in compressed or reconstructed form?
313 TreeState operating_state = get_operating_state(u_preliminary);
314
315 int iter = ulist.size()-1;
316 MADNESS_CHECK_THROW(iter>=0,"ulist must have size==1 at least -- forgot to initialize?");
317 plist.push_back(u_preliminary);
318 MADNESS_CHECK_THROW(ulist.size()+1==plist.size(),"ulist and plist have incorrect size -- forgot to initialize?");
319
320
321 // Solve subspace equations
322 // Q_ij = < u_kain[i] | r[j] > = < u_kain[i] | u_kain[j] - u_preliminary[j+1] >
323 Tensor<C> Qnew(iter+1,iter+1);
324 if (iter>0) Qnew(Slice(0,-2),Slice(0,-2)) = Q;
325 for (int i=0; i<=iter; i++) {
326 Qnew(i,iter) = inner(ulist[i],ulist[iter]) - inner(ulist[i],plist[iter+1]);
327 Qnew(iter,i) = inner(ulist[iter],ulist[i]) - inner(ulist[iter],plist[i+1]);
328 }
329 // ulist and rlist are now either compressed or redundant -- change back to compressed or reconstructed0
330 if constexpr (do_tree_states) {
331 for (auto& u : ulist) change_tree_state(u,operating_state,true);
332 for (auto& p : plist) change_tree_state(p,operating_state,true);
333 }
334
335 Q = Qnew;
336 c = KAIN(Q);
337
338 check_linear_dependence(Q,c,rcondtol,cabsmax,do_print);
339 if (do_print) print("subspace solution",c);
340
341 // Form new solution in u
342 T unew = alloc();
343 for (int i=0; i<=iter; i++) {
344// unew += (ulist[i] - rlist[i])*c[i];
345 unew += (plist[i+1])*c[i];
346 }
347 if constexpr (is_madness_function<T>::value) unew.reconstruct();
349 ulist.push_back(unew);
350
351 if (ulist.size() == maxsub) {
352 ulist.erase(ulist.begin());
353 if (not rlist.empty()) rlist.erase(rlist.begin());
354 if (not plist.empty()) plist.erase(plist.begin());
355 Q = copy(Q(Slice(1,-1),Slice(1,-1)));
356 }
357 return unew;
358 }
359
360 void initialize(const T& u_initial) {
362 ulist.push_back(u_initial); // initial guess
363 plist.push_back(alloc()); // empty function
364 }
365
366 };
367
368
369 template<typename T, std::size_t NDIM>
370 static inline XNonlinearSolver<std::vector<Function<T,NDIM>>,T,vector_function_allocator<T,NDIM>>
375
376
379
380
381}
382#endif
FunctionFactory implements the named-parameter idiom for Function.
Definition function_factory.h:86
FunctionFactory & treestate(const TreeState state)
Definition function_factory.h:173
A multiresolution adaptive numerical function.
Definition mra.h:139
Function< T, NDIM > & truncate(double tol=0.0, bool fence=true)
Truncate the function with optional fence. Compresses with fence if not compressed.
Definition mra.h:642
std::size_t size() const
Returns the number of coefficients in the function ... collective global sum.
Definition mra.h:573
Function< T, NDIM > & gaxpy(const T &alpha, const Function< Q, NDIM > &other, const R &beta, bool fence=true)
Inplace, general bi-linear operation in wavelet basis. No communication except for optional fence.
Definition mra.h:1025
A simple Krylov-subspace nonlinear equation solver.
Definition nonlinsol.h:90
void set_maxsub(const unsigned int &new_maxsub)
Definition nonlinsol.h:97
real_tensor Q
Definition nonlinsol.h:94
bool do_print
Definition nonlinsol.h:104
std::vector< Function< double, NDIM > > ulist
Definition nonlinsol.h:93
Function< double, NDIM > update(const Function< double, NDIM > &u, const Function< double, NDIM > &r, const double rcondtol=1e-8, const double cabsmax=1000.0)
Computes next trial solution vector.
Definition nonlinsol.h:118
unsigned int get_maxsub() const
Definition nonlinsol.h:100
NonlinearSolverND(unsigned int maxsub=10)
Definition nonlinsol.h:106
unsigned int maxsub
Maximum size of subspace dimension.
Definition nonlinsol.h:91
std::vector< Function< double, NDIM > > rlist
Definition nonlinsol.h:93
A slice defines a sub-range or patch of a dimension.
Definition slice.h:103
A tensor is a multidimensional array.
Definition tensor.h:317
A parallel world class.
Definition world.h:132
Generalized version of NonlinearSolver not limited to a single madness function.
Definition nonlinsol.h:207
void set_maxsub(int maxsub)
Definition nonlinsol.h:233
XNonlinearSolver(const Alloc &alloc=Alloc(), bool print=false)
Definition nonlinsol.h:216
void clear_subspace()
Definition nonlinsol.h:236
Tensor< C > c
coefficients for linear combination
Definition nonlinsol.h:212
void initialize(const T &u_initial)
Definition nonlinsol.h:360
Tensor< C > Q
Definition nonlinsol.h:211
std::vector< T > & get_rlist()
Definition nonlinsol.h:230
std::vector< T > ulist
Definition nonlinsol.h:210
Tensor< C > get_c() const
Definition nonlinsol.h:234
std::vector< T > & get_ulist()
Definition nonlinsol.h:229
std::vector< T > rlist
Definition nonlinsol.h:210
Alloc alloc
Definition nonlinsol.h:209
T update(const T &u_preliminary, const double rcondtol=1e-8, const double cabsmax=1000.0)
Computes next trial solution vector.
Definition nonlinsol.h:295
T update(const T &u, const T &r, const double rcondtol=1e-8, const double cabsmax=1000.0)
Computes next trial solution vector.
Definition nonlinsol.h:253
bool do_print
Definition nonlinsol.h:214
std::vector< T > plist
Subspace information.
Definition nonlinsol.h:210
XNonlinearSolver(const XNonlinearSolver &other)
Definition nonlinsol.h:222
unsigned int maxsub
Maximum size of subspace dimension.
Definition nonlinsol.h:208
std::vector< T > & get_plist()
Definition nonlinsol.h:231
char * p(char *buf, const char *name, int k, int initial_level, double thresh, int order)
Definition derivatives.cc:72
auto T(World &world, response_space &f) -> response_space
Definition global_functions.cc:34
static const double v
Definition hatom_sf_dirac.cc:20
static double u(double r, double c)
Definition he.cc:20
#define MADNESS_CHECK_THROW(condition, msg)
Check a condition — even in a release build the condition is always evaluated so it can have side eff...
Definition madness_exception.h:207
Main include file for MADNESS and defines Function interface.
Namespace for all elements and tools of MADNESS.
Definition DFParameters.h:10
Tensor< T > KAIN(const Tensor< T > &Q, double rcond=1e-12)
Solves non-linear equation using KAIN (returns coefficients to compute next vector)
Definition solvers.h:98
NonlinearSolverND< 3 > NonlinearSolver
Definition nonlinsol.h:161
TreeState
Definition funcdefaults.h:59
@ reconstructed
s coeffs at the leaves only
Definition funcdefaults.h:60
@ unknown
Definition funcdefaults.h:68
@ compressed
d coeffs in internal nodes, s and d coeffs at the root
Definition funcdefaults.h:61
const std::vector< Function< T, NDIM > > & reconstruct(const std::vector< Function< T, NDIM > > &v)
reconstruct a vector of functions
Definition vmra.h:162
void check_linear_dependence(const Tensor< C > &Q, Tensor< C > &c, const double rcondtol, const double cabsmax, bool do_print=true)
check for subspace linear dependency
Definition nonlinsol.h:63
void print(const T &t, const Ts &... ts)
Print items to std::cout (items separated by spaces) and terminate with a new line.
Definition print.h:225
@ TT_FULL
Definition gentensor.h:120
const Function< T, NDIM > & change_tree_state(const Function< T, NDIM > &f, const TreeState finalstate, bool fence=true)
change tree state of a function
Definition mra.h:2807
XNonlinearSolver< std::vector< Function< double, 6 > >, double, vector_function_allocator< double, 6 > > NonlinearVectorSolver_6d
Definition nonlinsol.h:378
double inner(response_space &a, response_space &b)
Definition response_functions.h:442
XNonlinearSolver< std::vector< Function< double, 3 > >, double, vector_function_allocator< double, 3 > > NonlinearVectorSolver_3d
Definition nonlinsol.h:377
static XNonlinearSolver< std::vector< Function< T, NDIM > >, T, vector_function_allocator< T, NDIM > > nonlinear_vector_solver(World &world, const long nvec)
Definition nonlinsol.h:371
Function< T, NDIM > copy(const Function< T, NDIM > &f, const std::shared_ptr< WorldDCPmapInterface< Key< NDIM > > > &pmap, bool fence=true)
Create a new copy of the function with different distribution and optional fence.
Definition mra.h:2066
double Q(double a)
Definition relops.cc:20
static const double c
Definition relops.cc:10
static const double m
Definition relops.cc:9
Defines interfaces for optimization and non-linear equation solvers.
Definition nonlinsol.h:165
T operator()()
Definition nonlinsol.h:166
Definition mra.h:2851
Definition nonlinsol.h:174
const int n
Definition nonlinsol.h:176
World & world
Definition nonlinsol.h:175
vector_function_allocator(World &world, const int nn)
Definition nonlinsol.h:180
std::vector< Function< T, NDIM > > operator()()
allocate a vector of n empty functions
Definition nonlinsol.h:183
void e()
Definition test_sig.cc:75