// Copyright (C) 2013-2015 Kasper Kristensen
// License: GPL-2

/*
  NOTE(review): this text was restored from a copy in which line breaks and
  everything between '<' and '>' had been lost. Line structure, template
  parameter lists, template arguments and '<' loop conditions were
  reconstructed from the surrounding code. Places where the reconstruction
  is an inference rather than forced by context carry their own
  NOTE(review) comment; diff against the upstream header before relying on
  them.
*/

/*
  Given function f0. Define recursively higher order reverse
  mode derivatives:

  f0: R^(n)         -> R^(m)      ( x            -> f0 (x)    )
  f1: R^(n+m)       -> R^(n)      ( (x,w1)       -> f0'(x)*w1 )
  f2: R^(n+m+n)     -> R^(n+m)    ( (x,w1,w2)    -> f1'(x)*w2 )
  f3: R^(n+m+n+n+m) -> R^(n+m+n)  ( (x,w1,w2,w3) -> f2'(x)*w3 )

  1. We define a 'generalized symbol' to represent all of these.
  _Reverse_mode_AD_ is trivially obtained for this symbol by calling
  itself on a higher level. Each occurrence on the tape will occupy
  O(n+m) memory units independent of the number of flops performed
  by f0.

  2. _Double_versions_ of the generalized symbol are obtained using
  nested AD types to tape f0, then recursively tape forward and
  reverse mode sweeps.

  Finally, given (1) and (2) the macro TMB_ATOMIC_VECTOR_FUNCTION
  will generate the atomic symbol.
*/

/* general helper functions */
#ifdef CPPAD_FRAMEWORK
namespace atomic{

  /**
      \name User defined atomic functions

      \note The following procedure is automatically performed with the macro REGISTER_ATOMIC.

      \verbatim
      Given function f0. Define recursively higher order reverse
      mode derivatives:

      f0: R^(n)         -> R^(m)      ( x            -> f0 (x)    )
      f1: R^(n+m)       -> R^(n)      ( (x,w1)       -> f0'(x)*w1 )
      f2: R^(n+m+n)     -> R^(n+m)    ( (x,w1,w2)    -> f1'(x)*w2 )
      f3: R^(n+m+n+n+m) -> R^(n+m+n)  ( (x,w1,w2,w3) -> f2'(x)*w3 )

      1. We define a 'generalized symbol' to represent all of these.
      _Reverse_mode_AD_ is trivially obtained for this symbol by calling
      itself on a higher level. Each occurrence on the tape will occupy
      O(n+m) memory units independent of the number of flops performed
      by f0.

      2. _Double_versions_ of the generalized symbol are obtained using
      nested AD types to tape f0, then recursively tape forward and
      reverse mode sweeps.

      Finally, given (1) and (2) the macro TMB_ATOMIC_VECTOR_FUNCTION
      will generate the atomic symbol.
      \endverbatim
      @{
  */

  /** \brief Construct a tape of a given template _functor_
      (Will be used to tape 'f0' for different nested AD types)

      \tparam Base Base type of the returned tape; must be given explicitly.
      \tparam Func Functor type; called with a vector of AD<Base>.
      \param f  Functor to record.
      \param x_ Point at which the functor is recorded.
      \return Pointer to a tape allocated with `new`; the caller is
      responsible for it.

      Writes "Generating tape" to Rcout on every call.
  */
  template <class Base, class Func>
  CppAD::ADFun<Base>* generate_tape(Func f, vector<double> x_){
    Rcout << "Generating tape\n";
    int n=x_.size();
    vector<AD<Base> > x(n);
    for(int i=0;i<n;i++)x[i]=AD<Base>(x_[i]);
    CppAD::Independent(x);
    vector<AD<Base> > y=f(x);
    /* Copy the result element by element into a fresh vector before
       handing it to the ADFun constructor */
    vector<AD<Base> > y2(y.size());
    for(int i=0;i<y.size();i++)y2[i]=y[i];
    CppAD::ADFun<Base>* padf=new CppAD::ADFun<Base>(x,y2);
    return padf;
  }

  /** \brief Lift tape of fn up one level by taping forward and reverse sweeps.
      Note: x_ needs only have length equal to the input domain dimension
      of f0. Zeros are filled in for all range directions.

      \param padf Tape to lift. It is deleted before returning, so the
      pointer must not be used afterwards.
      \param x_ Leading values of the new independent vector; the rest is
      filled with zeros.
      \return Pointer to the new tape (allocated with `new`) mapping
      R^(n+m) -> R^(n), where n and m are the domain and range dimensions
      of `padf`.
  */
  template <class Base>
  CppAD::ADFun<Base>* forrev(CppAD::ADFun<AD<Base> >* padf, vector<double> x_){
    size_t n=padf->Domain();
    size_t m=padf->Range();
    vector<AD<Base> > x(n+m);
    vector<AD<Base> > y(n);
    for(int i=0;i<x_.size();i++)x[i]=AD<Base>(x_[i]);
    for(int i=x_.size();i<x.size();i++)x[i]=AD<Base>(0);
    vector<AD<Base> > tmp1(n);
    vector<AD<Base> > tmp2(m);
    CppAD::Independent(x);
    /* NOTE(review): the two fill loops below were reconstructed: the first
       n independents are taken as the evaluation point and the remaining m
       as the range weights - confirm against upstream. */
    for(size_t i=0;i<n;i++)tmp1[i]=x[i];
    for(size_t i=0;i<m;i++)tmp2[i]=x[i+n];
    padf->Forward(0,tmp1);
    y = padf->Reverse(1,tmp2);
    CppAD::ADFun<Base>* padf2=new CppAD::ADFun<Base>(x,y);
    delete padf;
    return padf2;
  }

  /** \brief Recursively apply forrev until the lowest Base level (double)

      \param padf Tape at some nested AD level; consumed by forrev.
      \param x_   Point passed on to every forrev call.
      \return Tape with Base type double.
  */
  template <class Base>
  CppAD::ADFun<double>* multi_forrev(CppAD::ADFun<Base>* padf, vector<double> x_){
    return multi_forrev(forrev(padf, x_), x_);
  }
  /* End of the recursion: a double tape is returned unchanged */
  template <>
  CppAD::ADFun<double>* multi_forrev<double>(CppAD::ADFun<double>* padf, vector<double> x_) CSKIP({
    return padf;
  })

  /** \brief Tape symbol up to any order

      \tparam Func Functor type exposing a `ScalarType` typedef; the tape
      Base type is `ScalarType::value_type`.
      \param f Functor to record.
      \param x Point at which to record.
      \return Double tape obtained by recording `f` and lifting it with
      multi_forrev.
  */
  template<class Func>
  CppAD::ADFun<double>* tape_symbol(Func f, vector<double> x){
    typedef typename Func::ScalarType::value_type Base;
    CppAD::ADFun<Base>* f0=generate_tape<Base>(f,x);
    CppAD::ADFun<double>* fn=multi_forrev(f0,x);
    return fn;
  }

#ifdef _OPENMP
#define NTHREADS config.nthreads
#define THREAD omp_get_thread_num()
#else
#define NTHREADS 1
#define THREAD 0
#endif

  /** \brief General class to construct 'double versions' of the
      generalized symbol.

      \tparam UserFunctor Class template wrapping the user function for a
      given scalar type.
  */
  template<template<class> class UserFunctor>
  struct forrev_derivatives{
    bool initialized;
    /* Input (n) and output (m) dimension of the user function; set by do_init */
    int n,m;
    forrev_derivatives(){
      initialized=false;
    }
    /* ADFun pointers used by the double versions
       indexed as vpf[thread][level] */
    CppAD::vector<CppAD::vector<CppAD::ADFun<double>* > > vpf;
    /** \brief Optimize a tape and store it as level `i`: the pointer
        itself for thread 0 and a newly allocated copy for every other
        thread. */
    void cpyADfunPointer(CppAD::ADFun<double>* padf, int i){
      padf->optimize();
      vpf[0][i] = padf;
      /* Copy object for other threads */
      for(int thread=1;thread<NTHREADS;thread++){
        vpf[thread][i]=new CppAD::ADFun<double>();
        vpf[thread][i]->operator=(*padf);
      }
    }
    /** \brief Determine n and m and record the tapes for levels 0 to 3 at
        the point `x`. */
    void do_init(vector<double> x){
      UserFunctor<double> f;
      n=x.size();
      m=f(x).size();
      UserFunctor<AD<double> > f0;
      UserFunctor<AD<AD<double> > > f1;
      UserFunctor<AD<AD<AD<double> > > > f2;
      UserFunctor<AD<AD<AD<AD<double> > > > > f3;
      vpf.resize(NTHREADS);
      /* NOTE(review): the loop body and the four calls below were
         reconstructed from the f0..f3 declarations above and the levels
         0..3 handled by get_level - confirm against upstream. */
      for(int thread=0;thread<NTHREADS;thread++){
        vpf[thread].resize(4);
      }
      cpyADfunPointer(tape_symbol(f0,x), 0);
      cpyADfunPointer(tape_symbol(f1,x), 1);
      cpyADfunPointer(tape_symbol(f2,x), 2);
      cpyADfunPointer(tape_symbol(f3,x), 3);
    }
    /** \brief Run do_init on the first call only; later calls do nothing. */
    void init(vector<double> x){
      if(!initialized){
        do_init(x);
        initialized=true;
      }
    }
    /** \brief Output dimension of the generalized symbol for a given
        input dimension. Calls Rf_error if the input dimension matches
        none of the four levels. */
    int get_output_dim(int input_dim){
      int output_dim=-1;
      // Fibonacci type recursion for each 'column'
      if      (input_dim == n)         output_dim = m;
      else if (input_dim == n+m)       output_dim = n;
      else if (input_dim == n+m+n)     output_dim = n+m;
      else if (input_dim == n+m+n+n+m) output_dim = n+m+n;
      else Rf_error("get_output_dim failed");
      return output_dim;
    }
    // Calculate level from input dimension
    int get_level(int input_dim){
      int level=-1;
      if      (input_dim == n)         level = 0;
      else if (input_dim == n+m)       level = 1;
      else if (input_dim == n+m+n)     level = 2;
      else if (input_dim == n+m+n+n+m) level = 3;
      else Rf_error("get_level failed");
      return level;
    }
    // Evaluate: zero order forward sweep on the current thread's tape of
    // the level selected by the length of tx
    CppAD::vector<double> operator()(CppAD::vector<double> tx){
      int level = get_level(tx.size());
      return vpf[THREAD][level]->Forward(0,tx);
    }
  }; /* end class forrev_derivatives */

#undef NTHREADS
#undef THREAD

  /** \brief Wrap user function into a functor, generate double versions,
      and construct atomic function in a namespace */
#define REGISTER_ATOMIC(USERFUNCTION)                                   \
  namespace USERFUNCTION##NAMESPACE{                                    \
    template<class Type>                                                \
    struct UserFunctor{                                                 \
      typedef Type ScalarType;                                          \
      vector<Type> operator()(vector<Type> x){                          \
        return USERFUNCTION(x);                                         \
      }                                                                 \
    };                                                                  \
    atomic::forrev_derivatives<UserFunctor> double_version;             \
    TMB_ATOMIC_VECTOR_FUNCTION(                                         \
                               generalized_symbol                       \
                               ,                                        \
                               double_version.get_output_dim(tx.size()) \
                               ,                                        \
                               ty = double_version(tx);                 \
                               ,                                        \
                               CppAD::vector<Type> concat(tx.size() + py.size()); \
                               for(size_t i=0; i < tx.size(); i++) concat[i] = tx[i]; \
                               for(size_t i=0; i < py.size(); i++) concat[tx.size()+i] = py[i]; \
                               px = generalized_symbol(concat);         \
                                                                        ) \
    template<class Base>                                                \
    vector<Base> generalized_symbol(vector<Base> x){                    \
      CppAD::vector<Base> xx(x.size());                                 \
      for(int i=0;i<x.size();i++)xx[i]=x[i];                            \
      CppAD::vector<Base> yy=generalized_symbol(xx);                    \
      vector<Base> y(yy.size());                                        \
      for(int i=0;i<y.size();i++)y[i]=yy[i];                            \
      return y;                                                         \
    }                                                                   \
  }                                                                     \
  vector<double> USERFUNCTION(vector<double> x){                        \
    USERFUNCTION##NAMESPACE::double_version.init(x);                    \
    return USERFUNCTION##NAMESPACE::generalized_symbol(x);              \
  }                                                                     \
  vector<AD<double> > USERFUNCTION(vector<AD<double> > x){              \
    return USERFUNCTION##NAMESPACE::generalized_symbol(x);              \
  }                                                                     \
  vector<AD<AD<double> > > USERFUNCTION(vector<AD<AD<double> > > x){    \
    return USERFUNCTION##NAMESPACE::generalized_symbol(x);              \
  }                                                                     \
  vector<AD<AD<AD<double> > > > USERFUNCTION(vector<AD<AD<AD<double> > > > x){ \
    return USERFUNCTION##NAMESPACE::generalized_symbol(x);              \
  }

  /** @} */

} /* end namespace atomic */
#endif // CPPAD_FRAMEWORK

#ifdef TMBAD_FRAMEWORK
namespace atomic {

/** \brief User interface to checkpointing using TMBad
    \details This is the recommended way of constructing atomic functions
    without knowing the reverse mode derivatives.

    Usage: Within `objective_function` (or any other function) one can do
    ```
    AtomicLocal<Functor> F(Functor());
    ```
    - Each call to `F(x)` only generates one new operation on the ad stack.
    - Thread safe because local.
    - `F` is owned by the operation stack and is automatically freed when no longer needed.
*/
template <class Functor>
struct AtomicLocal {
  /* NOTE(review): the second StdWrap argument was reconstructed as
     vector<TMBad::ad_aug> - confirm against upstream. */
  typedef TMBad::StdWrap<Functor, vector<TMBad::ad_aug> > StdWrapFunctor;
  Functor F;
  TMBad::ADFun<> Tape;
  AtomicLocal(const Functor &F) : F(F) {}
  /** \brief Evaluate through the atomic tape. The tape is (re)built
      whenever the length of `x` differs from the tape's domain
      dimension. */
  template<class T>
  vector<T> operator()(const vector<T> &x) {
    if ( (size_t) x.size() != Tape.Domain() ) {
      Tape = TMBad::ADFun<>( StdWrapFunctor(F), x).atomic();
    }
    std::vector<T> x_(x.data(), x.data() + x.size());
    std::vector<T> y_ = Tape(x_);
    vector<T> y(y_);
    return y;
  }
  /** \brief Plain double evaluation: calls the functor directly, no tape
      involved. */
  vector<double> operator()(const vector<double> &x) {
    return F(x);
  }
};

/** \brief For backwards compatibility with CppAD
    \details Allocate an atomic function for each thread. Main purpose
    is to support the `REGISTER_ATOMIC` macro.
    \tparam Functor assumed to have a default CTOR
    \warning Static atomic functions are never freed.
*/
template <class Functor>
struct AtomicGlobal {
#ifdef _OPENMP
#define NTHREADS config.nthreads
#define THREAD omp_get_thread_num()
#else
#define NTHREADS 1
#define THREAD 0
#endif
  /* Points to the function-local static vector created in the CTOR */
  std::vector< AtomicLocal<Functor> >* p_;
  AtomicGlobal() {
    /* One AtomicLocal per thread; allocated once and never deleted */
    static std::vector< AtomicLocal<Functor> >* p =
      new std::vector< AtomicLocal<Functor> > (NTHREADS, Functor() );
    p_ = p;
  }
  /** \brief Forward the call to the current thread's AtomicLocal. */
  template<class T>
  vector<T> operator()(const vector<T> &x) {
    return ((*p_)[THREAD])(x);
  }
#undef NTHREADS
#undef THREAD
};

/** \brief Wrap user function into a functor and define `double` and
    `TMBad::ad_aug` overloads that evaluate it through AtomicGlobal.

    NOTE(review): the UserFunctor template argument of each overload was
    lost and has been reconstructed to match the overload's own scalar
    type (`double` resp. `TMBad::ad_aug`) - confirm against upstream.
*/
#define REGISTER_ATOMIC(USERFUNCTION)                                   \
namespace USERFUNCTION##NAMESPACE {                                     \
  template<class Type>                                                  \
  struct UserFunctor {                                                  \
    typedef Type ScalarType;                                            \
    vector<Type> operator()(const vector<Type> &x) {                    \
      return USERFUNCTION(x);                                           \
    }                                                                   \
  };                                                                    \
}                                                                       \
vector<double> USERFUNCTION(const vector<double> &x) {                  \
  typedef USERFUNCTION##NAMESPACE::UserFunctor<double> Functor;         \
  return atomic::AtomicGlobal<Functor>()(x);                            \
}                                                                       \
vector<TMBad::ad_aug> USERFUNCTION(const vector<TMBad::ad_aug> &x) {    \
  typedef USERFUNCTION##NAMESPACE::UserFunctor<TMBad::ad_aug> Functor;  \
  return atomic::AtomicGlobal<Functor>()(x);                            \
}

} // End namespace atomic
#endif // TMBAD_FRAMEWORK