Merge pull request #547 from stan-dev/cleanup/546-operands-partials

operands_and_partials refactor
stan-dev · May 24, 2017 · f1f056f · f1f056f
2 parents b5d61bf + ae81a2e
commit f1f056f
Show file tree

Hide file tree

Showing 188 changed files with 2,564 additions and 3,906 deletions.
diff --git a/stan/math/fwd/mat.hpp b/stan/math/fwd/mat.hpp
@@ -46,4 +46,6 @@
 #include <stan/math/fwd/mat/functor/gradient.hpp>
 #include <stan/math/fwd/mat/functor/jacobian.hpp>
 
+#include <stan/math/fwd/mat/meta/operands_and_partials.hpp>
+
 #endif
diff --git a/stan/math/fwd/mat/meta/operands_and_partials.hpp b/stan/math/fwd/mat/meta/operands_and_partials.hpp
@@ -0,0 +1,97 @@
+#ifndef STAN_MATH_FWD_MAT_META_OPERANDS_AND_PARTIALS_HPP
+#define STAN_MATH_FWD_MAT_META_OPERANDS_AND_PARTIALS_HPP
+
+#include <stan/math/fwd/mat/fun/typedefs.hpp>
+#include <stan/math/fwd/scal/meta/operands_and_partials.hpp>
+#include <stan/math/prim/scal/meta/broadcast_array.hpp>
+#include <vector>
+
+namespace stan {
+  namespace math {
+    namespace internal {
+      // Vectorized Univariate
+      template <typename Dx>
+      class ops_partials_edge<Dx, std::vector<fvar<Dx> > > {
+      public:
+        typedef std::vector<fvar<Dx> > Op;
+        typedef Eigen::Matrix<Dx, -1, 1> partials_t;
+        partials_t partials_;  // For univariate use-cases
+        broadcast_array<partials_t> partials_vec_;  // For multivariate
+        explicit ops_partials_edge(const Op& ops)
+          : partials_(partials_t::Zero(ops.size())),
+            partials_vec_(partials_), operands_(ops) {}
+
+      private:
+        template<typename, typename, typename, typename, typename>
+        friend class stan::math::operands_and_partials;
+        const Op& operands_;
+
+        Dx dx() {
+          Dx derivative(0);
+          for (size_t i = 0; i < this->operands_.size(); ++i) {
+            derivative += this->partials_[i] * this->operands_[i].d_;
+          }
+          return derivative;
+        }
+      };
+
+      template <typename Dx, int R, int C>
+      class ops_partials_edge<Dx, Eigen::Matrix<fvar<Dx>, R, C> > {
+      public:
+        typedef Eigen::Matrix<Dx, R, C> partials_t;
+        typedef Eigen::Matrix<fvar<Dx>, R, C> Op;
+        partials_t partials_;  // For univariate use-cases
+        broadcast_array<partials_t> partials_vec_;  // For multivariate
+        explicit ops_partials_edge(const Op& ops)
+          : partials_(partials_t::Zero(ops.rows(), ops.cols())),
+            partials_vec_(partials_), operands_(ops) {}
+
+      private:
+        template<typename, typename, typename, typename, typename>
+        friend class stan::math::operands_and_partials;
+        const Op& operands_;
+
+        Dx dx() {
+          Dx derivative(0);
+          for (int i = 0; i < this->operands_.size(); ++i) {
+            derivative += this->partials_(i) * this->operands_(i).d_;
+          }
+          return derivative;
+        }
+      };
+
+      // Multivariate; vectors of eigen types
+      template <typename Dx, int R, int C>
+      class ops_partials_edge
+      <Dx, std::vector<Eigen::Matrix<fvar<Dx>, R, C> > > {
+      public:
+        typedef std::vector<Eigen::Matrix<fvar<Dx>, R, C> > Op;
+        typedef Eigen::Matrix<Dx, -1, -1> partial_t;
+        std::vector<partial_t> partials_vec_;
+        explicit ops_partials_edge(const Op& ops)
+          : partials_vec_(ops.size()), operands_(ops) {
+          for (size_t i = 0; i < ops.size(); ++i) {
+            partials_vec_[i] = partial_t::Zero(ops[i].rows(), ops[i].cols());
+          }
+        }
+
+      private:
+        template<typename, typename, typename, typename, typename>
+        friend class stan::math::operands_and_partials;
+        const Op& operands_;
+
+        Dx dx() {
+          Dx derivative(0);
+          for (size_t i = 0; i < this->operands_.size(); ++i) {
+            for (int j = 0; j < this->operands_[i].size(); ++j) {
+              derivative
+                += this->partials_vec_[i](j) * this->operands_[i](j).d_;
+            }
+          }
+          return derivative;
+        }
+      };
+    }  // namespace internal
+  }  // namespace math
+}  // namespace stan
+#endif
diff --git a/stan/math/fwd/scal.hpp b/stan/math/fwd/scal.hpp
@@ -5,7 +5,7 @@
 #include <stan/math/fwd/scal/meta/ad_promotable.hpp>
 #include <stan/math/fwd/scal/meta/is_fvar.hpp>
 #include <stan/math/fwd/scal/meta/partials_type.hpp>
-#include <stan/math/fwd/scal/meta/OperandsAndPartials.hpp>
+#include <stan/math/fwd/scal/meta/operands_and_partials.hpp>
 
 #include <stan/math/prim/scal.hpp>
 

diff --git a/stan/math/fwd/scal/meta/OperandsAndPartials.hpp b/stan/math/fwd/scal/meta/OperandsAndPartials.hpp
diff --git a/stan/math/fwd/scal/meta/operands_and_partials.hpp b/stan/math/fwd/scal/meta/operands_and_partials.hpp
@@ -0,0 +1,98 @@
+#ifndef STAN_MATH_FWD_SCAL_META_OPERANDS_AND_PARTIALS_HPP
+#define STAN_MATH_FWD_SCAL_META_OPERANDS_AND_PARTIALS_HPP
+
+#include <stan/math/prim/scal/meta/broadcast_array.hpp>
+#include <stan/math/prim/scal/meta/operands_and_partials.hpp>
+#include <stan/math/fwd/core/fvar.hpp>
+
+namespace stan {
+  namespace math {
+    namespace internal {
+      template <typename Dx>
+      class ops_partials_edge<Dx, fvar<Dx> > {
+      public:
+        typedef fvar<Dx> Op;
+        Dx partial_;
+        broadcast_array<Dx> partials_;
+        explicit ops_partials_edge(const Op& op)
+          : partial_(0), partials_(partial_), operand_(op) {}
+
+      private:
+        template<typename, typename, typename, typename, typename>
+        friend class stan::math::operands_and_partials;
+        const Op& operand_;
+
+        Dx dx() {
+          return this->partials_[0] * this->operand_.d_;
+        }
+      };
+    }  // namespace internal
+
+    /**
+     * This class builds partial derivatives with respect to a set of
+     * operands. There are two reason for the generality of this
+     * class. The first is to handle vector and scalar arguments
+     * without needing to write additional code. The second is to use
+     * this class for writing probability distributions that handle
+     * primitives, reverse mode, and forward mode variables
+     * seamlessly.
+     *
+     * Conceptually, this class is used when we want to manually calculate
+     * the derivative of a function and store this manual result on the
+     * autodiff stack in a sort of "compressed" form. Think of it like an
+     * easy-to-use interface to rev/core/precomputed_gradients.
+     *
+     * This class now supports multivariate use-cases as well by
+     * exposing edge#_.partials_vec
+     *
+     * This is the specialization for when the return type is fvar,
+     * which should be for forward mode and all higher-order cases.
+     *
+     * @tparam Op1 type of the first operand
+     * @tparam Op2 type of the second operand
+     * @tparam Op3 type of the third operand
+     * @tparam Op4 type of the fourth operand
+     * @tparam T_return_type return type of the expression. This defaults
+     *   to a template metaprogram that calculates the scalar promotion of
+     *   Op1 -- Op4
+     */
+    template <typename Op1, typename Op2, typename Op3, typename Op4,
+              typename Dx>
+    class operands_and_partials<Op1, Op2, Op3, Op4, fvar<Dx> > {
+    public:
+      internal::ops_partials_edge<Dx, Op1> edge1_;
+      internal::ops_partials_edge<Dx, Op2> edge2_;
+      internal::ops_partials_edge<Dx, Op3> edge3_;
+      internal::ops_partials_edge<Dx, Op4> edge4_;
+      typedef fvar<Dx> T_return_type;
+      explicit operands_and_partials(const Op1& o1)
+        : edge1_(o1) { }
+      operands_and_partials(const Op1& o1, const Op2& o2)
+        : edge1_(o1), edge2_(o2) { }
+      operands_and_partials(const Op1& o1, const Op2& o2, const Op3& o3)
+        : edge1_(o1), edge2_(o2), edge3_(o3) { }
+      operands_and_partials(const Op1& o1, const Op2& o2, const Op3& o3,
+                            const Op4& o4)
+        : edge1_(o1), edge2_(o2), edge3_(o3), edge4_(o4) { }
+
+      /**
+       * Build the node to be stored on the autodiff graph.
+       * This should contain both the value and the tangent.
+       *
+       * For scalars, we don't calculate any tangents.
+       * For reverse mode, we end up returning a type of var that will calculate
+       * the appropriate adjoint using the stored operands and partials.
+       * Forward mode just calculates the tangent on the spot and returns it in
+       * a vanilla fvar.
+       *
+       * @param value the return value of the function we are compressing
+       * @return the value with its derivative
+       */
+      T_return_type build(Dx value) {
+        Dx deriv = edge1_.dx() + edge2_.dx() + edge3_.dx() + edge4_.dx();
+        return T_return_type(value, deriv);
+      }
+    };
+  }
+}
+#endif