diff --git a/doxygen/contributor_help_pages/common_pitfalls.md b/doxygen/contributor_help_pages/common_pitfalls.md
index f3e8fb817ad..3ce9e15569f 100644
--- a/doxygen/contributor_help_pages/common_pitfalls.md
+++ b/doxygen/contributor_help_pages/common_pitfalls.md
@@ -154,8 +154,6 @@ The implementation of @ref stan::math::make_holder is [here](https://github.com/
 
 ### Move Semantics
 
-In general, Stan Math does not use move semantics very often.
-This is because of our arena allocator.
 Move semantics generally work as
 
 ```cpp
@@ -179,6 +177,96 @@ We can see in the above that the standard style of a move (the constructor takin
 But in Stan, particularly for reverse mode, we need to keep memory around even if it's only temporary for when we call the gradient calculations in the reverse pass.
 And since memory for reverse mode is stored in our arena allocator no copying happens in the first place.
 
+Functions for Stan Math's reverse mode autodiff should use [_perfect forwarding_](https://drewcampbell92.medium.com/understanding-move-semantics-and-perfect-forwarding-part-3-65575d523ff8) arguments. Perfect forwarding arguments use a template parameter with no qualifiers such as `const` and `volatile` and have a double ampersand `&&` next to them.
+
+```c++
+  template <typename T>
+  auto my_function(T&& x) {
+    return my_other_function(std::forward<T>(x));
+  }
+```
+
+The `std::forward<T>` in the code above tells the compiler that if `T` is deduced to be an rvalue reference (such as `Eigen::MatrixXd&&`), then it should be moved to `my_other_function`, where it can possibly use another object's move constructor to reuse memory.
+A perfect forwarding argument of a function accepts any reference type as its input argument. 
+The above signature is equivalent to writing out several functions with different reference types
+
+```c++
+  // Accepts a plain lvalue reference
+  auto my_function(Eigen::MatrixXd& x) {
+    return my_other_function(x);
+  }
+  // Accepts a const lvalue reference
+  auto my_function(const Eigen::MatrixXd& x) {
+    return my_other_function(x);
+  }
+  // Accepts an rvalue reference
+  auto my_function(Eigen::MatrixXd&& x) {
+    return my_other_function(std::move(x));
+  }
+  // Accepts a const rvalue reference
+  auto my_function(const Eigen::MatrixXd&& x) {
+    return my_other_function(std::move(x));
+  }
+```
+
+In Stan, perfect forwarding is used in reverse mode functions which can accept an Eigen matrix type.
+
+```c++
+template <typename T, require_eigen_vt<is_var, T>* = nullptr>
+inline auto sin(T&& x) {
+  // Store `x` on the arena
+  arena_t<T> x_arena(std::forward<T>(x));
+  arena_t<T> ret(x_arena.val().array().sin().matrix());
+  reverse_pass_callback([x_arena, ret]() mutable {
+    x_arena.adj() += ret.adj().cwiseProduct(x_arena.val().array().cos().matrix());
+  });
+  return ret;
+}
+```
+
+Let's go through the above line by line.
+
+```c++
+template <typename T, require_eigen_vt<is_var, T>* = nullptr>
+inline auto sin(T&& x) {
+```
+
+The signature for this function has a template `T` that is required to be an Eigen type with a `value_type` that is a `var` type. 
+The template parameter `T` is then used in the signature as a perfect forwarding argument. 
+
+```c++
+  // Store `x` on the arena
+  arena_t<T> x_arena(std::forward<T>(x));
+```
+
+The input is stored in the arena, which is where the perfect forwarding magic actually occurs. 
+If `T` is an lvalue type such as `Eigen::MatrixXd&` then `arena_matrix` will use its copy constructor, creating new memory in Stan's arena allocator and then copying the values of `x` into that memory. 
+But if `T` was a temporary rvalue type such as `Eigen::MatrixXd&&`, then the `arena_matrix` class will use its move constructor to place the temporary matrix in Stan's `var_alloc_stack_`. 
+The `var_alloc_stack_` is used to hold objects that were created outside of the arena allocator but need to be deleted when the arena allocator is cleared. 
+This allows the `arena_matrix` to reuse the memory from the temporary matrix. Then the matrix will be deleted once the arena allocator requests memory to be cleared.
+
+```c++
+  arena_t<T> ret(x_arena.val().array().sin().matrix());
+```
+
+This construction of an `arena_matrix` will *not* use the move constructor for `arena_matrix`. 
+Here, `x_arena` is an `arena_matrix<T>`, which is then wrapped in an expression to compute the elementwise `sin`. 
+That expression will be evaluated into new memory allocated in the arena allocator and then a pointer to it will be stored in the `arena_matrix`.
+
+```c++
+  reverse_pass_callback([x_arena, ret]() mutable {
+    x_arena.adj() += ret.adj().cwiseProduct(x_arena.val().array().cos().matrix());
+  });
+  return ret;
+```
+
+The rest of this code follows the standard format for the rest of Stan Math's reverse mode that accepts Eigen types as input. 
+The `reverse_pass_callback` function accepts a lambda as input and places the lambda in Stan's callback stack to be called later when `grad()` is called by the user.
+Since `arena_matrix` types only store a pointer to memory allocated elsewhere they are copied into the lambda. 
+The body of the lambda holds the gradient calculation needed for the reverse mode pass.
+
+Then finally `ret`, the `arena_matrix` type is returned by the function.
+
 When working with arithmetic types, keep in mind that moving Scalars is often less optimal than simply taking their copy.
 For instance, Stan's `var` type uses the pointer to implementation (PIMPL) pattern, so it simply holds a pointer of size 8 bytes.
 A `double` is also 8 bytes which just so happens to fit exactly in a [word](https://en.wikipedia.org/wiki/Word_(computer_architecture)) of most modern CPUs with at least 64-byte cache lines.
@@ -190,6 +278,45 @@ The general rules to follow for passing values to a function are:
 2. If you are writing a function for reverse mode, pass values by `const&`
 3. In prim, if you are confident and working with larger types, use perfect forwarding to pass values that can be moved from. Otherwise simply pass values by `const&`.
 
+### Using auto is Dangerous With Eigen Matrix Functions in Reverse Mode
+
+Using `auto` with the Stan Math library requires care, just as it does with [Eigen](https://eigen.tuxfamily.org/dox/TopicPitfalls.html). 
+Along with the cautions mentioned in the Eigen docs, there are also memory considerations when using reverse mode automatic differentiation. 
+When returning from a function in the Stan Math library with an Eigen matrix output with a scalar `var` type, the actual returned type will often be an `arena_matrix<Eigen::Matrix<...>>`. 
+The `arena_matrix` class is an Eigen matrix where the underlying array of memory is located in Stan's memory arena. 
+The `arena_matrix` that is returned by Math functions is normally the same one resting in the callback used to calculate gradients in the reverse pass.
+Directly changing the elements of this matrix would also change the memory the reverse pass callback sees which would result in incorrect calculations.
+
+The simple solution to this is that when you use a math library function that returns a matrix and then want to assign to any of the individual elements of the matrix, assign to an actual Eigen matrix type instead of using auto. 
+In the below example, we see the first case which uses auto and will change the memory of the `arena_matrix` returned in the callback for multiply's reverse mode.
+Directly below it is the safe version, which just directly assigns to an Eigen matrix type and is safe to do element insertion into.
+
+```c++
+Eigen::Matrix<var, -1, 1> y;
+Eigen::Matrix<var, -1, -1> X;
+// Bad!! Will change memory used by reverse pass callback within multiply!
+auto mu = multiply(X, y);
+mu(4) = 1.0;
+// Good! Will not change memory used by reverse pass callback within multiply
+Eigen::Matrix<var, -1, 1> mu_good = multiply(X, y);
+mu_good(4) = 1.0;
+```
+
+The reason we do this is for cases where function returns are passed to other functions. 
+An `arena_matrix` will always make a shallow copy when being constructed from another `arena_matrix`, which lets the functions avoid unnecessary copies.
+
+```c++
+Eigen::Matrix<var, -1, 1> y1;
+Eigen::Matrix<var, -1, -1> X1;
+Eigen::Matrix<var, -1, 1> y2;
+Eigen::Matrix<var, -1, -1> X2;
+auto mu1 = multiply(X1, y1);
+auto mu2 = multiply(X2, y2);
+// Inputs not copied in this case!
+auto z = add(mu1, mu2);
+```
+
+
 ### Passing variables that need destructors called after the reverse pass (`make_chainable_ptr`)
 
 When possible, non-arena variables should be copied to the arena to be used in the reverse pass.
@@ -242,22 +369,17 @@ grad();
 ```
 
 Now `res` is `innocent_return` and we've changed one of the elements of `innocent_return`, but that is also going to change the element of `res` which is being used in our reverse pass callback!
-The answer for this is simple but sadly requires a copy.
 
-```cpp
-template <typename EigVec, require_eigen_vt<is_var, EigVec>* = nullptr>
-inline var cool_fun(const EigVec& v) {
-  arena_t<EigVec> arena_v(v);
-  arena_t<EigVec> res = arena_v.val().array() * arena_v.val().array();
-  reverse_pass_callback([res, arena_v]() mutable {
-    arena_v.adj().array() += (2.0 * res.adj().array()) * arena_v.val().array();
-  });
-  return plain_type_t<EigVec>(res);
-}
-```
+End users of Stan Math must use `auto` with caution. 
+When a user wishes to manipulate the coefficients of a matrix that is a return from a function in Stan Math, they should assign the matrix to a plain Eigen type.
 
-we make a deep copy of the return whose inner `vari` will not be the same, but the `var` will produce a new copy of the pointer to the `vari`.
-Now the user code above will be protected, and it is safe for them to assign to individual elements of the `auto` returned matrix.
+```c++
+Eigen::Matrix<var, -1, 1> x = Eigen::Matrix<double, -1, 1>::Random(5);
+Eigen::MatrixXd actually_innocent_return = cool_fun(x);
+actually_innocent_return.coeffRef(3) = var(3.0);
+auto still_unsafe_return = cool_fun2(actually_innocent_return);
+grad();
+```
 
 ### Const correctness, reverse mode autodiff, and arena types
 
diff --git a/lib/tbb_2020.3/STAN_CHANGES b/lib/tbb_2020.3/STAN_CHANGES
index 67193d07e32..bc82dfb5969 100644
--- a/lib/tbb_2020.3/STAN_CHANGES
+++ b/lib/tbb_2020.3/STAN_CHANGES
@@ -6,3 +6,10 @@ This file documents changes done for the stan-math project
 - build/windows.inc patches for RTools make:
   - L15 changed setting to use '?=', allowing override
   - L25,L113,L114 added additional '/' to each cmd flag
+
+- Support for Windows ARM64 with RTools:
+  - build/Makefile.tbb
+    - L94 Wrapped the use of `--version-script` export in conditional on non-WINARM64
+  - build/windows.gcc.inc
+    - L84 Wrapped the use of `-flifetime-dse` flag in conditional on non-WINARM64
+    
\ No newline at end of file
diff --git a/lib/tbb_2020.3/build/Makefile.tbb b/lib/tbb_2020.3/build/Makefile.tbb
index 1556899811a..cf889cc31a2 100644
--- a/lib/tbb_2020.3/build/Makefile.tbb
+++ b/lib/tbb_2020.3/build/Makefile.tbb
@@ -91,7 +91,11 @@ ifneq (,$(TBB.DEF))
 tbb.def: $(TBB.DEF) $(TBB.LST)
 	$(CPLUS) $(PREPROC_ONLY) $< $(CPLUS_FLAGS) $(INCLUDES) > $@
 
-LIB_LINK_FLAGS += $(EXPORT_KEY)tbb.def
+# LLVM on Windows doesn't need --version-script export
+# https://reviews.llvm.org/D63743
+ifeq (, $(WINARM64))
+  LIB_LINK_FLAGS += $(EXPORT_KEY)tbb.def
+endif
 $(TBB.DLL): tbb.def
 endif
 
diff --git a/lib/tbb_2020.3/build/windows.gcc.inc b/lib/tbb_2020.3/build/windows.gcc.inc
index dc123eedc9c..d882ceb920a 100644
--- a/lib/tbb_2020.3/build/windows.gcc.inc
+++ b/lib/tbb_2020.3/build/windows.gcc.inc
@@ -80,8 +80,11 @@ endif
 # gcc 6.0 and later have -flifetime-dse option that controls
 # elimination of stores done outside the object lifetime
 ifeq (ok,$(call detect_js,/minversion gcc 6.0))
-    # keep pre-contruction stores for zero initialization
-    DSE_KEY = -flifetime-dse=1
+    # Clang does not support -flifetime-dse
+    ifeq (, $(WINARM64))
+      # keep pre-contruction stores for zero initialization
+      DSE_KEY = -flifetime-dse=1
+    endif
 endif
 
 ifeq ($(cfg), release)
diff --git a/make/compiler_flags b/make/compiler_flags
index c6b9228a82c..0be4905ccee 100644
--- a/make/compiler_flags
+++ b/make/compiler_flags
@@ -17,6 +17,7 @@ endif
 
 ## Set OS specific library filename extensions
 ifeq ($(OS),Windows_NT)
+  WINARM64 := $(shell echo | $(CXX) -E -dM -  | findstr __aarch64__)
   LIBRARY_SUFFIX ?= .dll
 endif
 
@@ -271,8 +272,13 @@ CXXFLAGS_TBB ?= -I $(TBB_INC)
 else
 CXXFLAGS_TBB ?= -I $(TBB)/include
 endif
+LDFLAGS_TBB ?= -Wl,-L,"$(TBB_LIB)" -Wl,--disable-new-dtags
+
+# Windows LLVM/Clang does not support -rpath, and it is not needed on Windows anyway
+ifeq ($(WINARM64),)
+  LDFLAGS_TBB += -Wl,-rpath,"$(TBB_LIB)"
+endif
 
-LDFLAGS_TBB ?= -Wl,-L,"$(TBB_LIB)" -Wl,-rpath,"$(TBB_LIB)" -Wl,--disable-new-dtags
 LDLIBS_TBB ?= -ltbb
 
 else
@@ -290,7 +296,12 @@ ifeq ($(OS),Linux)
 endif
 
 CXXFLAGS_TBB ?= -I $(TBB)/include
-LDFLAGS_TBB ?= -Wl,-L,"$(TBB_BIN_ABSOLUTE_PATH)" -Wl,-rpath,"$(TBB_BIN_ABSOLUTE_PATH)" $(LDFLAGS_FLTO_FLTO) $(LDFLAGS_OPTIM_TBB)
+LDFLAGS_TBB ?= -Wl,-L,"$(TBB_BIN_ABSOLUTE_PATH)" $(LDFLAGS_FLTO_FLTO) $(LDFLAGS_OPTIM_TBB)
+
+# Windows LLVM/Clang does not support -rpath, and it is not needed on Windows anyway
+ifeq ($(WINARM64),)
+  LDFLAGS_TBB += -Wl,-rpath,"$(TBB_BIN_ABSOLUTE_PATH)"
+endif
 LDLIBS_TBB ?= -ltbb
 
 endif
diff --git a/make/libraries b/make/libraries
index 3e9b1d0d75d..10460c6c75b 100644
--- a/make/libraries
+++ b/make/libraries
@@ -23,6 +23,7 @@ CPPLINT ?= $(MATH)lib/cpplint_1.4.5
 #       Fortran bindings which we do not need for stan-math. Thus these targets
 #       are ignored here. This convention was introduced with 4.0.
 ##
+ifndef SUNDIALS_TARGETS
 
 SUNDIALS_CVODES := $(patsubst %.c,%.o,\
   $(wildcard $(SUNDIALS)/src/cvodes/*.c) \
@@ -87,7 +88,7 @@ $(STAN_SUNDIALS_HEADERS) : $(SUNDIALS_TARGETS)
 clean-sundials:
 	@echo '  cleaning sundials targets'
 	$(RM) $(wildcard $(sort $(SUNDIALS_CVODES) $(SUNDIALS_IDAS) $(SUNDIALS_KINSOL) $(SUNDIALS_NVECSERIAL) $(SUNDIALS_TARGETS)))
-
+endif
 
 ############################################################
 # TBB build rules
@@ -138,6 +139,11 @@ endif
 ifeq (Windows_NT, $(OS))
   ifeq ($(IS_UCRT),true)
     TBB_CXXFLAGS += -D_UCRT
+  endif
+  # TBB does not have assembly code for Windows ARM64, so we need to use GCC builtins
+  ifneq ($(WINARM64),)
+	TBB_CXXFLAGS += -DTBB_USE_GCC_BUILTINS
+	CXXFLAGS_TBB += -DTBB_USE_GCC_BUILTINS
   endif
 	SH_CHECK := $(shell command -v sh 2>/dev/null)
 	ifdef SH_CHECK
@@ -169,11 +175,11 @@ endif
 $(TBB_BIN)/tbb.def: $(TBB_BIN)/tbb-make-check
 	@mkdir -p $(TBB_BIN)
 	touch $(TBB_BIN)/version_$(notdir $(TBB))
-	tbb_root="$(TBB_RELATIVE_PATH)" CXX="$(CXX)" CC="$(TBB_CC)" LDFLAGS='$(LDFLAGS_TBB)' '$(MAKE)' -C "$(TBB_BIN)" -r -f "$(TBB_ABSOLUTE_PATH)/build/Makefile.tbb" compiler=$(TBB_CXX_TYPE) cfg=release stdver=c++1y  CXXFLAGS="$(TBB_CXXFLAGS)"
+	tbb_root="$(TBB_RELATIVE_PATH)" WINARM64="$(WINARM64)" CXX="$(CXX)" CC="$(TBB_CC)" LDFLAGS='$(LDFLAGS_TBB)' '$(MAKE)' -C "$(TBB_BIN)" -r -f "$(TBB_ABSOLUTE_PATH)/build/Makefile.tbb" compiler=$(TBB_CXX_TYPE) cfg=release stdver=c++1y  CXXFLAGS="$(TBB_CXXFLAGS)"
 
 $(TBB_BIN)/tbbmalloc.def: $(TBB_BIN)/tbb-make-check
 	@mkdir -p $(TBB_BIN)
-	tbb_root="$(TBB_RELATIVE_PATH)" CXX="$(CXX)" CC="$(TBB_CC)" LDFLAGS='$(LDFLAGS_TBB)' '$(MAKE)' -C "$(TBB_BIN)" -r -f "$(TBB_ABSOLUTE_PATH)/build/Makefile.tbbmalloc" compiler=$(TBB_CXX_TYPE) cfg=release stdver=c++1y malloc CXXFLAGS="$(TBB_CXXFLAGS)"
+	tbb_root="$(TBB_RELATIVE_PATH)" WINARM64="$(WINARM64)" CXX="$(CXX)" CC="$(TBB_CC)" LDFLAGS='$(LDFLAGS_TBB)' '$(MAKE)' -C "$(TBB_BIN)" -r -f "$(TBB_ABSOLUTE_PATH)/build/Makefile.tbbmalloc" compiler=$(TBB_CXX_TYPE) cfg=release stdver=c++1y malloc CXXFLAGS="$(TBB_CXXFLAGS)"
 
 $(TBB_BIN)/libtbb.dylib: $(TBB_BIN)/tbb.def
 $(TBB_BIN)/libtbbmalloc.dylib: $(TBB_BIN)/tbbmalloc.def
diff --git a/stan/math/prim/fun/value_of.hpp b/stan/math/prim/fun/value_of.hpp
index 7cc37ac9b2c..64286bbe0c3 100644
--- a/stan/math/prim/fun/value_of.hpp
+++ b/stan/math/prim/fun/value_of.hpp
@@ -67,7 +67,7 @@ inline auto value_of(const T& x) {
  * @param[in] M Matrix to be converted
  * @return Matrix of values
  **/
-template <typename EigMat, require_eigen_t<EigMat>* = nullptr,
+template <typename EigMat, require_eigen_dense_base_t<EigMat>* = nullptr,
           require_not_st_arithmetic<EigMat>* = nullptr>
 inline auto value_of(EigMat&& M) {
   return make_holder(
@@ -77,6 +77,28 @@ inline auto value_of(EigMat&& M) {
       std::forward<EigMat>(M));
 }
 
+/**
+ * Return a sparse matrix holding the values of the stored coefficients of a
+ * sparse matrix whose scalar type is not arithmetic.
+ *
+ * The result is allocated with the same number of rows and columns as `M`,
+ * space is reserved for `M`'s number of non-zeros, and `value_of` is applied
+ * to each stored coefficient before the result is compressed.
+ *
+ * @tparam EigMat type accepted by `require_eigen_sparse_base_t` whose scalar
+ *  type is not arithmetic
+ * @param[in] M Sparse matrix to be converted
+ * @return Compressed sparse matrix of values
+ **/
+template <typename EigMat, require_eigen_sparse_base_t<EigMat>* = nullptr,
+          require_not_st_arithmetic<EigMat>* = nullptr>
+inline auto value_of(EigMat&& M) {
+  auto&& M_ref = to_ref(M);
+  using scalar_t = decltype(value_of(std::declval<value_type_t<EigMat>>()));
+  promote_scalar_t<scalar_t, plain_type_t<EigMat>> ret(M_ref.rows(),
+                                                       M_ref.cols());
+  ret.reserve(M_ref.nonZeros());
+  // Eigen reports sizes as `Eigen::Index`, so the outer counter uses it too
+  for (Eigen::Index k = 0; k < M_ref.outerSize(); ++k) {
+    for (typename std::decay_t<EigMat>::InnerIterator it(M_ref, k); it; ++it) {
+      ret.insert(it.row(), it.col()) = value_of(it.valueRef());
+    }
+  }
+  ret.makeCompressed();
+  return ret;
+}
+
+/**
+ * Overload for sparse matrices whose scalar type is arithmetic: the input
+ * already holds plain values, so it is forwarded back to the caller.
+ *
+ * @tparam EigMat type accepted by `require_eigen_sparse_base_t` whose scalar
+ *  type is arithmetic
+ * @param[in] M Sparse matrix of arithmetic values
+ * @return The forwarded input
+ **/
+template <typename EigMat, require_eigen_sparse_base_t<EigMat>* = nullptr,
+          require_st_arithmetic<EigMat>* = nullptr>
+inline auto value_of(EigMat&& M) {
+  return std::forward<EigMat>(M);
+}
+
 }  // namespace math
 }  // namespace stan
 
diff --git a/stan/math/prim/meta/is_arena_matrix.hpp b/stan/math/prim/meta/is_arena_matrix.hpp
index f9553a5b016..bd2acfe4c38 100644
--- a/stan/math/prim/meta/is_arena_matrix.hpp
+++ b/stan/math/prim/meta/is_arena_matrix.hpp
@@ -23,5 +23,17 @@ template <typename T>
 using require_arena_matrix_t = require_t<is_arena_matrix<std::decay_t<T>>>;
 /*! @} */
 
+/*! \ingroup require_eigen_types */
+/*! \defgroup arena_matrix_types arena_matrix  */
+/*! \addtogroup arena_matrix_types */
+/*! @{ */
+
+/*! \brief Require type does not satisfy @ref is_arena_matrix */
+/*! @tparam T the type to check */
+template <typename T>
+using require_not_arena_matrix_t
+    = require_t<bool_constant<!is_arena_matrix<std::decay_t<T>>::value>>;
+/*! @} */
+
 }  // namespace stan
 #endif
diff --git a/stan/math/prim/meta/is_eigen_dense_base.hpp b/stan/math/prim/meta/is_eigen_dense_base.hpp
index 7b1ebc6cd1e..940f65bb2ef 100644
--- a/stan/math/prim/meta/is_eigen_dense_base.hpp
+++ b/stan/math/prim/meta/is_eigen_dense_base.hpp
@@ -33,6 +33,22 @@ using require_eigen_dense_base_t
     = require_t<is_eigen_dense_base<std::decay_t<T>>>;
 /*! @} */
 
+/*! \ingroup require_eigens_types */
+/*! \defgroup eigen_dense_base_types eigen_dense_base_types  */
+/*! \addtogroup eigen_dense_base_types */
+/*! @{ */
+
+/*! \brief Require type satisfies @ref is_eigen_dense_base */
+/*! and value type satisfies `TypeCheck` */
+/*! @tparam TypeCheck The type trait to check the value type against */
+/*! @tparam Check The type to test @ref is_eigen_dense_base for and whose
+ * @ref value_type is checked with `TypeCheck` */
+template <template <class...> class TypeCheck, class... Check>
+using require_eigen_dense_base_vt
+    = require_t<container_type_check_base<is_eigen_dense_base, value_type_t,
+                                          TypeCheck, Check...>>;
+/*! @} */
+
 }  // namespace stan
 
 #endif
diff --git a/stan/math/prim/meta/promote_scalar_type.hpp b/stan/math/prim/meta/promote_scalar_type.hpp
index fee623ab141..fbcbbe1f749 100644
--- a/stan/math/prim/meta/promote_scalar_type.hpp
+++ b/stan/math/prim/meta/promote_scalar_type.hpp
@@ -4,6 +4,8 @@
 #include <stan/math/prim/fun/Eigen.hpp>
 #include <stan/math/prim/meta/is_eigen.hpp>
 #include <stan/math/prim/meta/is_var.hpp>
+#include <stan/math/prim/meta/is_eigen_dense_base.hpp>
+#include <stan/math/prim/meta/is_eigen_sparse_base.hpp>
 #include <vector>
 
 namespace stan {
@@ -80,7 +82,7 @@ struct promote_scalar_type<T, S,
  * @tparam S input matrix type
  */
 template <typename T, typename S>
-struct promote_scalar_type<T, S, require_eigen_t<S>> {
+struct promote_scalar_type<T, S, require_eigen_dense_base_t<S>> {
   /**
    * The promoted type.
    */
@@ -93,6 +95,16 @@ struct promote_scalar_type<T, S, require_eigen_t<S>> {
                    S::RowsAtCompileTime, S::ColsAtCompileTime>>::type;
 };
 
+template <typename T, typename S>
+struct promote_scalar_type<T, S, require_eigen_sparse_base_t<S>> {
+  /**
+   * The promoted type: an `Eigen::SparseMatrix` whose scalar is the promotion
+   * of `S::Scalar` to `T`, keeping the `Options` and `StorageIndex` of `S`.
+   */
+  using type = Eigen::SparseMatrix<
+      typename promote_scalar_type<T, typename S::Scalar>::type, S::Options,
+      typename S::StorageIndex>;
+};
+
 template <typename... PromotionScalars, typename... UnPromotedTypes>
 struct promote_scalar_type<std::tuple<PromotionScalars...>,
                            std::tuple<UnPromotedTypes...>> {
diff --git a/stan/math/prim/prob/normal_lpdf.hpp b/stan/math/prim/prob/normal_lpdf.hpp
index 069a0f80599..f53c521a74e 100644
--- a/stan/math/prim/prob/normal_lpdf.hpp
+++ b/stan/math/prim/prob/normal_lpdf.hpp
@@ -41,9 +41,8 @@ namespace math {
 template <bool propto, typename T_y, typename T_loc, typename T_scale,
           require_all_not_nonscalar_prim_or_rev_kernel_expression_t<
               T_y, T_loc, T_scale>* = nullptr>
-inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(const T_y& y,
-                                                      const T_loc& mu,
-                                                      const T_scale& sigma) {
+inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(T_y&& y, T_loc&& mu,
+                                                      T_scale&& sigma) {
   using T_partials_return = partials_return_t<T_y, T_loc, T_scale>;
   using T_y_ref = ref_type_if_not_constant_t<T_y>;
   using T_mu_ref = ref_type_if_not_constant_t<T_loc>;
@@ -51,9 +50,9 @@ inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(const T_y& y,
   static constexpr const char* function = "normal_lpdf";
   check_consistent_sizes(function, "Random variable", y, "Location parameter",
                          mu, "Scale parameter", sigma);
-  T_y_ref y_ref = y;
-  T_mu_ref mu_ref = mu;
-  T_sigma_ref sigma_ref = sigma;
+  T_y_ref y_ref = std::forward<T_y>(y);
+  T_mu_ref mu_ref = std::forward<T_loc>(mu);
+  T_sigma_ref sigma_ref = std::forward<T_scale>(sigma);
 
   decltype(auto) y_val = to_ref(as_value_column_array_or_scalar(y_ref));
   decltype(auto) mu_val = to_ref(as_value_column_array_or_scalar(mu_ref));
@@ -63,7 +62,7 @@ inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(const T_y& y,
   check_finite(function, "Location parameter", mu_val);
   check_positive(function, "Scale parameter", sigma_val);
 
-  if (size_zero(y, mu, sigma)) {
+  if (size_zero(y_ref, mu_ref, sigma_ref)) {
     return 0.0;
   }
   if (!include_summand<propto, T_y, T_loc, T_scale>::value) {
@@ -78,7 +77,7 @@ inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(const T_y& y,
   const auto& y_scaled_sq
       = to_ref_if<!is_constant_all<T_scale>::value>(y_scaled * y_scaled);
 
-  size_t N = max_size(y, mu, sigma);
+  size_t N = max_size(y_ref, mu_ref, sigma_ref);
   T_partials_return logp = -0.5 * sum(y_scaled_sq);
   if (include_summand<propto>::value) {
     logp += NEG_LOG_SQRT_TWO_PI * N;
@@ -106,10 +105,10 @@ inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(const T_y& y,
 }
 
 template <typename T_y, typename T_loc, typename T_scale>
-inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(const T_y& y,
-                                                      const T_loc& mu,
-                                                      const T_scale& sigma) {
-  return normal_lpdf<false>(y, mu, sigma);
+inline return_type_t<T_y, T_loc, T_scale> normal_lpdf(T_y&& y, T_loc&& mu,
+                                                      T_scale&& sigma) {
+  return normal_lpdf<false>(std::forward<T_y>(y), std::forward<T_loc>(mu),
+                            std::forward<T_scale>(sigma));
 }
 
 }  // namespace math
diff --git a/stan/math/rev/core/arena_matrix.hpp b/stan/math/rev/core/arena_matrix.hpp
index 69baf5b81c0..8913d4adc70 100644
--- a/stan/math/rev/core/arena_matrix.hpp
+++ b/stan/math/rev/core/arena_matrix.hpp
@@ -4,9 +4,9 @@
 #include <stan/math/prim/fun/Eigen.hpp>
 #include <stan/math/rev/core/chainable_alloc.hpp>
 #include <stan/math/rev/core/chainablestack.hpp>
+#include <stan/math/rev/core/chainable_object.hpp>
 #include <stan/math/rev/core/var_value_fwd_declare.hpp>
 #include <stan/math/prim/fun/to_ref.hpp>
-
 namespace stan {
 namespace math {
 
@@ -49,25 +49,91 @@ class arena_matrix<MatrixType, require_eigen_dense_base_t<MatrixType>>
           ChainableStack::instance_->memalloc_.alloc_array<Scalar>(size),
           size) {}
 
+ private:
+  /**
+   * Number of rows the arena matrix should have when built from `x`.
+   *
+   * When one of this type and `T` is a compile-time row vector and the other
+   * a compile-time column vector, the dimensions are swapped and `x.cols()`
+   * is returned; otherwise `x.rows()` is returned.
+   *
+   * Declared `static` because it is called from constructor initializer
+   * lists before the base class has been initialized, where calling a
+   * non-static member function is undefined behaviour.
+   *
+   * @tparam T type exposing `RowsAtCompileTime`, `ColsAtCompileTime`,
+   *  `rows()` and `cols()`
+   * @param x object whose dimensions are inspected
+   * @return row count to use for the arena matrix
+   */
+  template <typename T>
+  static constexpr auto get_rows(const T& x) {
+    return (RowsAtCompileTime == 1 && T::ColsAtCompileTime == 1)
+                   || (ColsAtCompileTime == 1 && T::RowsAtCompileTime == 1)
+               ? x.cols()
+               : x.rows();
+  }
+  /**
+   * Number of columns the arena matrix should have when built from `x`.
+   *
+   * When one of this type and `T` is a compile-time row vector and the other
+   * a compile-time column vector, the dimensions are swapped and `x.rows()`
+   * is returned; otherwise `x.cols()` is returned.
+   *
+   * Declared `static` because it is called from constructor initializer
+   * lists before the base class has been initialized, where calling a
+   * non-static member function is undefined behaviour.
+   *
+   * @tparam T type exposing `RowsAtCompileTime`, `ColsAtCompileTime`,
+   *  `rows()` and `cols()`
+   * @param x object whose dimensions are inspected
+   * @return column count to use for the arena matrix
+   */
+  template <typename T>
+  static constexpr auto get_cols(const T& x) {
+    return (RowsAtCompileTime == 1 && T::ColsAtCompileTime == 1)
+                   || (ColsAtCompileTime == 1 && T::RowsAtCompileTime == 1)
+               ? x.rows()
+               : x.cols();
+  }
+
+ public:
   /**
-   * Constructs `arena_matrix` from an expression.
+   * Constructs `arena_matrix` from an expression
    * @param other expression
    */
   template <typename T, require_eigen_t<T>* = nullptr>
   arena_matrix(const T& other)  // NOLINT
-      : Base::Map(
-          ChainableStack::instance_->memalloc_.alloc_array<Scalar>(
-              other.size()),
-          (RowsAtCompileTime == 1 && T::ColsAtCompileTime == 1)
-                  || (ColsAtCompileTime == 1 && T::RowsAtCompileTime == 1)
-              ? other.cols()
-              : other.rows(),
-          (RowsAtCompileTime == 1 && T::ColsAtCompileTime == 1)
-                  || (ColsAtCompileTime == 1 && T::RowsAtCompileTime == 1)
-              ? other.rows()
-              : other.cols()) {
+      : Base::Map(ChainableStack::instance_->memalloc_.alloc_array<Scalar>(
+                      other.size()),
+                  get_rows(other), get_cols(other)) {
     *this = other;
   }
+  /**
+   * Overwrite the current arena_matrix with new memory and assign a matrix to
+   * it
+   * @tparam T An eigen type inheriting from `Eigen::EigenBase`
+   * @param other A matrix that will be copied over to the arena allocator
+   * @return `*this`
+   * @note Placement new is used to point the underlying map at a newly
+   * allocated arena array sized from `other`, with dimensions chosen by
+   * `get_rows` and `get_cols`; the coefficients of `other` are then copied
+   * in through `Base::operator=`.
+   */
+  template <typename T, require_eigen_t<T>* = nullptr>
+  arena_matrix& operator=(const T& other) {
+    new (this) Base(
+        ChainableStack::instance_->memalloc_.alloc_array<Scalar>(other.size()),
+        get_rows(other), get_cols(other));
+    Base::operator=(other);
+    return *this;
+  }
+
+  /**
+   * Constructs `arena_matrix` from an rvalue expression that is a `plain_type`,
+   *  then moves it to the object stack.
+   * @tparam T A type that inherits from Eigen::DenseBase that is not an
+   * `arena_matrix`.
+   * @param other expression
+   * @note When T is both an rvalue and a plain type, the expression is moved to
+   * the object stack.
+   */
+  template <typename T, require_eigen_t<T>* = nullptr,
+            require_not_arena_matrix_t<T>* = nullptr,
+            require_t<std::is_rvalue_reference<T&&>>* = nullptr,
+            require_plain_type_t<T>* = nullptr,
+            require_same_t<T, MatrixType>* = nullptr>
+  arena_matrix(T&& other)  // NOLINT
+      : Base::Map([](auto&& x) {
+          using base_map_t =
+              typename stan::math::arena_matrix<MatrixType>::Base;
+          auto other_ptr = make_chainable_ptr(std::move(x));
+          // other has its rows and cols swapped already if it needed that
+          return base_map_t(&(other_ptr->coeffRef(0)), other_ptr->rows(),
+                            other_ptr->cols());
+        }(std::move(other))) {}
+
+  /**
+   * Assignment operator for assigning an expression.
+   * This is for rvalue plain type objects that can be moved over to the object
+   * stack instead of allocating new memory.
+   * @tparam T A plain Eigen type, the same as `MatrixType`, that is passed as
+   * an rvalue and is not an `arena_matrix`.
+   * @param other expression to evaluate into this
+   * @return `*this`
+   */
+  template <typename T, require_eigen_t<T>* = nullptr,
+            require_not_arena_matrix_t<T>* = nullptr,
+            require_t<std::is_rvalue_reference<T&&>>* = nullptr,
+            require_plain_type_t<T>* = nullptr,
+            require_same_t<T, MatrixType>* = nullptr>
+  arena_matrix& operator=(T&& other) {
+    auto other_ptr = make_chainable_ptr(std::move(other));
+    new (this)
+        Base(&(other_ptr->coeffRef(0)), other_ptr->rows(), other_ptr->cols());
+    return *this;
+  }
 
   /**
    * Constructs `arena_matrix` from an expression. This makes an assumption that
@@ -101,29 +167,6 @@ class arena_matrix<MatrixType, require_eigen_dense_base_t<MatrixType>>
     return *this;
   }
 
-  /**
-   * Assignment operator for assigning an expression.
-   * @param a expression to evaluate into this
-   * @return `*this`
-   */
-  template <typename T>
-  arena_matrix& operator=(const T& a) {
-    // do we need to transpose?
-    if ((RowsAtCompileTime == 1 && T::ColsAtCompileTime == 1)
-        || (ColsAtCompileTime == 1 && T::RowsAtCompileTime == 1)) {
-      // placement new changes what data map points to - there is no allocation
-      new (this) Base(
-          ChainableStack::instance_->memalloc_.alloc_array<Scalar>(a.size()),
-          a.cols(), a.rows());
-
-    } else {
-      new (this) Base(
-          ChainableStack::instance_->memalloc_.alloc_array<Scalar>(a.size()),
-          a.rows(), a.cols());
-    }
-    Base::operator=(a);
-    return *this;
-  }
   /**
    * Forces hard copying matrices into an arena matrix
    * @tparam T Any type assignable to `Base`
@@ -225,8 +268,10 @@ class arena_matrix<MatrixType, require_eigen_sparse_base_t<MatrixType>>
    */
   arena_matrix(const arena_matrix<MatrixType>& other)
       : Base::Map(other.rows(), other.cols(), other.nonZeros(),
-                  other.outerIndexPtr(), other.innerIndexPtr(),
-                  other.valuePtr(), other.innernonZeroPtr()) {}
+                  const_cast<StorageIndex*>(other.outerIndexPtr()),
+                  const_cast<StorageIndex*>(other.innerIndexPtr()),
+                  const_cast<Scalar*>(other.valuePtr()),
+                  const_cast<StorageIndex*>(other.innerNonZeroPtr())) {}
   /**
    * Move constructor.
    * @note Since the memory for the arena matrix sits in Stan's memory arena all
@@ -235,8 +280,10 @@ class arena_matrix<MatrixType, require_eigen_sparse_base_t<MatrixType>>
    */
   arena_matrix(arena_matrix<MatrixType>&& other)
       : Base::Map(other.rows(), other.cols(), other.nonZeros(),
-                  other.outerIndexPtr(), other.innerIndexPtr(),
-                  other.valuePtr(), other.innerNonZeroPtr()) {}
+                  const_cast<StorageIndex*>(other.outerIndexPtr()),
+                  const_cast<StorageIndex*>(other.innerIndexPtr()),
+                  const_cast<Scalar*>(other.valuePtr()),
+                  const_cast<StorageIndex*>(other.innerNonZeroPtr())) {}
   /**
    * Copy constructor. No actual copy is performed
    * @note Since the memory for the arena matrix sits in Stan's memory arena all
@@ -245,8 +292,10 @@ class arena_matrix<MatrixType, require_eigen_sparse_base_t<MatrixType>>
    */
   arena_matrix(arena_matrix<MatrixType>& other)
       : Base::Map(other.rows(), other.cols(), other.nonZeros(),
-                  other.outerIndexPtr(), other.innerIndexPtr(),
-                  other.valuePtr(), other.innerNonZeroPtr()) {}
+                  const_cast<StorageIndex*>(other.outerIndexPtr()),
+                  const_cast<StorageIndex*>(other.innerIndexPtr()),
+                  const_cast<Scalar*>(other.valuePtr()),
+                  const_cast<StorageIndex*>(other.innerNonZeroPtr())) {}
 
   // without this using, compiler prefers combination of implicit construction
   // and copy assignment to the inherited operator when assigned an expression
@@ -259,7 +308,8 @@ class arena_matrix<MatrixType, require_eigen_sparse_base_t<MatrixType>>
    * @return `*this`
    */
   template <typename ArenaMatrix,
-            require_same_t<ArenaMatrix, arena_matrix<MatrixType>>* = nullptr>
+            require_same_t<std::decay_t<ArenaMatrix>,
+                           arena_matrix<MatrixType>>* = nullptr>
   arena_matrix& operator=(ArenaMatrix&& other) {
     // placement new changes what data map points to - there is no allocation
     new (this) Base(other.rows(), other.cols(), other.nonZeros(),
@@ -280,7 +330,7 @@ class arena_matrix<MatrixType, require_eigen_sparse_base_t<MatrixType>>
   template <typename Expr,
             require_not_same_t<Expr, arena_matrix<MatrixType>>* = nullptr>
   arena_matrix& operator=(Expr&& expr) {
-    *this = arena_matrix(std::forward<Expr>(expr));
+    new (this) arena_matrix(std::forward<Expr>(expr));
     return *this;
   }
 
diff --git a/stan/math/rev/core/chainable_object.hpp b/stan/math/rev/core/chainable_object.hpp
index 0631d88354c..d4e22bb966d 100644
--- a/stan/math/rev/core/chainable_object.hpp
+++ b/stan/math/rev/core/chainable_object.hpp
@@ -1,11 +1,9 @@
 #ifndef STAN_MATH_REV_CORE_CHAINABLE_OBJECT_HPP
 #define STAN_MATH_REV_CORE_CHAINABLE_OBJECT_HPP
 
-#include <stan/math/rev/meta.hpp>
-#include <stan/math/rev/core/chainable_alloc.hpp>
-#include <stan/math/rev/core/typedefs.hpp>
 #include <stan/math/prim/fun/Eigen.hpp>
-#include <stan/math/prim/fun/typedefs.hpp>
+#include <stan/math/prim/meta.hpp>
+#include <stan/math/rev/core/chainable_alloc.hpp>
 #include <vector>
 
 namespace stan {
diff --git a/stan/math/rev/core/operator_addition.hpp b/stan/math/rev/core/operator_addition.hpp
index 2ecf9204379..458fc3c5ce3 100644
--- a/stan/math/rev/core/operator_addition.hpp
+++ b/stan/math/rev/core/operator_addition.hpp
@@ -108,12 +108,12 @@ inline var operator+(Arith a, const var& b) {
  */
 template <typename VarMat1, typename VarMat2,
           require_all_rev_matrix_t<VarMat1, VarMat2>* = nullptr>
-inline auto add(const VarMat1& a, const VarMat2& b) {
+inline auto add(VarMat1&& a, VarMat2&& b) {
   check_matching_dims("add", "a", a, "b", b);
   using op_ret_type = decltype(a.val() + b.val());
   using ret_type = return_var_matrix_t<op_ret_type, VarMat1, VarMat2>;
-  arena_t<VarMat1> arena_a(a);
-  arena_t<VarMat2> arena_b(b);
+  arena_t<VarMat1> arena_a(std::forward<VarMat1>(a));
+  arena_t<VarMat2> arena_b(std::forward<VarMat2>(b));
   arena_t<ret_type> ret(arena_a.val() + arena_b.val());
   reverse_pass_callback([ret, arena_a, arena_b]() mutable {
     for (Eigen::Index j = 0; j < ret.cols(); ++j) {
@@ -124,7 +124,7 @@ inline auto add(const VarMat1& a, const VarMat2& b) {
       }
     }
   });
-  return ret_type(ret);
+  return ret;
 }
 
 /**
@@ -139,18 +139,18 @@ inline auto add(const VarMat1& a, const VarMat2& b) {
 template <typename Arith, typename VarMat,
           require_st_arithmetic<Arith>* = nullptr,
           require_rev_matrix_t<VarMat>* = nullptr>
-inline auto add(const VarMat& a, const Arith& b) {
+inline auto add(VarMat&& a, const Arith& b) {
   if (is_eigen<Arith>::value) {
     check_matching_dims("add", "a", a, "b", b);
   }
   using op_ret_type
       = decltype((a.val().array() + as_array_or_scalar(b)).matrix());
   using ret_type = return_var_matrix_t<op_ret_type, VarMat>;
-  arena_t<VarMat> arena_a(a);
+  arena_t<VarMat> arena_a(std::forward<VarMat>(a));
   arena_t<ret_type> ret(arena_a.val().array() + as_array_or_scalar(b));
   reverse_pass_callback(
       [ret, arena_a]() mutable { arena_a.adj() += ret.adj_op(); });
-  return ret_type(ret);
+  return ret;
 }
 
 /**
@@ -165,8 +165,8 @@ inline auto add(const VarMat& a, const Arith& b) {
 template <typename Arith, typename VarMat,
           require_st_arithmetic<Arith>* = nullptr,
           require_rev_matrix_t<VarMat>* = nullptr>
-inline auto add(const Arith& a, const VarMat& b) {
-  return add(b, a);
+inline auto add(const Arith& a, VarMat&& b) {
+  return add(std::forward<VarMat>(b), a);
 }
 
 /**
@@ -185,7 +185,7 @@ inline auto add(const Var& a, const EigMat& b) {
   using ret_type = return_var_matrix_t<EigMat>;
   arena_t<ret_type> ret(a.val() + b.array());
   reverse_pass_callback([ret, a]() mutable { a.adj() += ret.adj().sum(); });
-  return ret_type(ret);
+  return ret;
 }
 
 /**
@@ -217,9 +217,9 @@ inline auto add(const EigMat& a, const Var& b) {
 template <typename Var, typename VarMat,
           require_var_vt<std::is_arithmetic, Var>* = nullptr,
           require_rev_matrix_t<VarMat>* = nullptr>
-inline auto add(const Var& a, const VarMat& b) {
+inline auto add(const Var& a, VarMat&& b) {
   using ret_type = return_var_matrix_t<VarMat>;
-  arena_t<VarMat> arena_b(b);
+  arena_t<VarMat> arena_b(std::forward<VarMat>(b));
   arena_t<ret_type> ret(a.val() + arena_b.val().array());
   reverse_pass_callback([ret, a, arena_b]() mutable {
     for (Eigen::Index j = 0; j < ret.cols(); ++j) {
@@ -230,7 +230,7 @@ inline auto add(const Var& a, const VarMat& b) {
       }
     }
   });
-  return ret_type(ret);
+  return ret;
 }
 
 /**
@@ -246,8 +246,8 @@ inline auto add(const Var& a, const VarMat& b) {
 template <typename Var, typename VarMat,
           require_var_vt<std::is_arithmetic, Var>* = nullptr,
           require_rev_matrix_t<VarMat>* = nullptr>
-inline auto add(const VarMat& a, const Var& b) {
-  return add(b, a);
+inline auto add(VarMat&& a, const Var& b) {
+  return add(b, std::forward<VarMat>(a));
 }
 
 template <typename T1, typename T2,
@@ -274,8 +274,8 @@ inline auto add(const T1& a, const T2& b) {
  */
 template <typename VarMat1, typename VarMat2,
           require_any_var_matrix_t<VarMat1, VarMat2>* = nullptr>
-inline auto operator+(const VarMat1& a, const VarMat2& b) {
-  return add(a, b);
+inline auto operator+(VarMat1&& a, VarMat2&& b) {
+  return add(std::forward<VarMat1>(a), std::forward<VarMat2>(b));
 }
 
 }  // namespace math
diff --git a/stan/math/rev/core/var.hpp b/stan/math/rev/core/var.hpp
index c56d4f09a42..bce9283225d 100644
--- a/stan/math/rev/core/var.hpp
+++ b/stan/math/rev/core/var.hpp
@@ -418,6 +418,18 @@ class var_value<T, internal::require_matrix_var_value<T>> {
         });
   }
 
+  /**
+   * Construct a `var_value` with premade @ref arena_matrix types.
+   *  The values and adjoint matrices passed here will be shallow copied.
+   * @tparam S type of the value in the `var_value` to assign
+   * @param val The value matrix to go into the vari
+   * @param adj the adjoint matrix to go into the vari
+   */
+  template <typename S, typename T_ = T,
+            require_assignable_t<value_type, S>* = nullptr,
+            require_arena_matrix_t<S>* = nullptr>
+  var_value(const S& val, const S& adj) : vi_(new vari_type(val, adj)) {}
+
   /**
    * Construct a variable from a pointer to a variable implementation.
    * @param vi A vari_value pointer.
diff --git a/stan/math/rev/core/vari.hpp b/stan/math/rev/core/vari.hpp
index 80da3b0f46d..cef37d29a31 100644
--- a/stan/math/rev/core/vari.hpp
+++ b/stan/math/rev/core/vari.hpp
@@ -821,17 +821,16 @@ class vari_value<T, require_eigen_sparse_base_t<T>> : public vari_base {
    */
   static constexpr int ColsAtCompileTime = T::ColsAtCompileTime;
 
+  /**
+   * The value of this variable.
+   */
+  arena_matrix<PlainObject> val_;
   /**
    * The adjoint of this variable, which is the partial derivative
    * of this variable with respect to the root variable.
    */
   arena_matrix<PlainObject> adj_;
 
-  /**
-   * The value of this variable.
-   */
-  arena_matrix<PlainObject> val_;
-
   /**
    * Construct a variable implementation from a value. The
    * adjoint is initialized to zero.
@@ -847,10 +846,21 @@ class vari_value<T, require_eigen_sparse_base_t<T>> : public vari_base {
    * @param x Value of the constructed variable.
    */
   template <typename S, require_convertible_t<S&, T>* = nullptr>
-  explicit vari_value(S&& x) : adj_(x), val_(std::forward<S>(x)) {
-    this->set_zero_adjoint();
+  explicit vari_value(S&& x)
+      : val_(std::forward<S>(x)),
+        adj_(val_.rows(), val_.cols(), val_.nonZeros(), val_.outerIndexPtr(),
+             val_.innerIndexPtr(),
+             arena_matrix<Eigen::VectorXd>(val_.nonZeros()).setZero().data(),
+             val_.innerNonZeroPtr()) {
+    ChainableStack::instance_->var_stack_.push_back(this);
+  }
+
+  vari_value(const arena_matrix<PlainObject>& val,
+             const arena_matrix<PlainObject>& adj)
+      : val_(val), adj_(adj) {
     ChainableStack::instance_->var_stack_.push_back(this);
   }
+
   /**
    * Construct an sparse Eigen variable implementation from a value. The
    *  adjoint is initialized to zero and if `stacked` is `false` this vari
@@ -869,8 +879,12 @@ class vari_value<T, require_eigen_sparse_base_t<T>> : public vari_base {
    * that its `chain()` method is not called.
    */
   template <typename S, require_convertible_t<S&, T>* = nullptr>
-  vari_value(S&& x, bool stacked) : adj_(x), val_(std::forward<S>(x)) {
-    this->set_zero_adjoint();
+  vari_value(S&& x, bool stacked)
+      : val_(std::forward<S>(x)),
+        adj_(val_.rows(), val_.cols(), val_.nonZeros(), val_.outerIndexPtr(),
+             val_.innerIndexPtr(),
+             arena_matrix<Eigen::VectorXd>(val_.nonZeros()).setZero().data(),
+             val_.innerNonZeroPtr()) {
     if (stacked) {
       ChainableStack::instance_->var_stack_.push_back(this);
     } else {
diff --git a/stan/math/rev/fun.hpp b/stan/math/rev/fun.hpp
index 4893ddc0540..929e88aa4c3 100644
--- a/stan/math/rev/fun.hpp
+++ b/stan/math/rev/fun.hpp
@@ -169,6 +169,7 @@
 #include <stan/math/rev/fun/tgamma.hpp>
 #include <stan/math/rev/fun/to_var.hpp>
 #include <stan/math/rev/fun/to_arena.hpp>
+#include <stan/math/rev/fun/to_soa_sparse_matrix.hpp>
 #include <stan/math/rev/fun/to_var_value.hpp>
 #include <stan/math/rev/fun/to_vector.hpp>
 #include <stan/math/rev/fun/trace.hpp>
diff --git a/stan/math/rev/fun/csr_matrix_times_vector.hpp b/stan/math/rev/fun/csr_matrix_times_vector.hpp
index d0cb4bd2373..4665c7a4dbd 100644
--- a/stan/math/rev/fun/csr_matrix_times_vector.hpp
+++ b/stan/math/rev/fun/csr_matrix_times_vector.hpp
@@ -2,6 +2,7 @@
 #define STAN_MATH_REV_FUN_CSR_MATRIX_TIMES_VECTOR_HPP
 
 #include <stan/math/prim/fun/Eigen.hpp>
+#include <stan/math/rev/fun/to_soa_sparse_matrix.hpp>
 #include <stan/math/rev/core.hpp>
 #include <stan/math/prim/err.hpp>
 #include <stan/math/prim/fun/csr_u_to_z.hpp>
@@ -11,37 +12,116 @@ namespace stan {
 namespace math {
 
 namespace internal {
-template <typename T1, typename T2, typename Res,
-          require_eigen_t<T1>* = nullptr>
-void update_w(T1& w, int m, int n, std::vector<int, arena_allocator<int>>& u,
-              std::vector<int, arena_allocator<int>>& v, T2&& b, Res&& res) {
-  Eigen::Map<Eigen::SparseMatrix<var, Eigen::RowMajor>> w_mat(
-      m, n, w.size(), u.data(), v.data(), w.data());
-  for (int k = 0; k < w_mat.outerSize(); ++k) {
-    for (Eigen::Map<Eigen::SparseMatrix<var, Eigen::RowMajor>>::InnerIterator
-             it(w_mat, k);
-         it; ++it) {
-      it.valueRef().adj()
-          += res.adj().coeff(it.row()) * value_of(b).coeff(it.col());
-    }
+/**
+ * `vari` for csr_matrix_times_vector
+ * @note `csr_matrix_times_vector` uses the old inheritance
+ *  style to set up the reverse pass because of a linking
+ *  issue on Windows when using link-time optimization (`-flto`).
+ *
+ * @tparam Result_ Either a type inheriting from `Eigen::DenseBase` with scalar
+ * type `var` or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+ * @tparam WMat_ Either a type inheriting from `Eigen::DenseBase` with scalar
+ * type `var` or `double`. Or a `var<T>` where `T` inherits from
+ * `Eigen::SparseBase`
+ * @tparam B_ Either a type inheriting from `Eigen::DenseBase` with scalar type
+ * `var` or `double`. Or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+ *
+ */
+template <typename Result_, typename WMat_, typename B_>
+struct csr_adjoint : public vari {
+  std::decay_t<Result_> res_;
+  std::decay_t<WMat_> w_mat_;
+  std::decay_t<B_> b_;
+
+  template <typename T1, typename T2, typename T3>
+  csr_adjoint(T1&& res, T2&& w_mat, T3&& b)
+      : vari(0.0),
+        res_(std::forward<T1>(res)),
+        w_mat_(std::forward<T2>(w_mat)),
+        b_(std::forward<T3>(b)) {}
+
+  void chain() { chain_internal(res_, w_mat_, b_); }
+
+  /**
+   * Overload for calculating adjoints of `w_mat` and `b`
+   * @tparam Result Either a type inheriting from `Eigen::DenseBase` with scalar
+   * type `var` or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+   * @tparam WMat Either a type inheriting from `Eigen::DenseBase` with scalar
+   * type `var`. Or a `var<T>` where `T` inherits from `Eigen::SparseBase`
+   * @tparam B Either a type inheriting from `Eigen::DenseBase` with scalar type
+   * `var`. Or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+   * @param res The vector result of the forward pass calculation
+   * @param w_mat A sparse matrix
+   * @param b A vector
+   */
+  template <typename Result, typename WMat, typename B,
+            require_rev_matrix_t<WMat>* = nullptr,
+            require_rev_matrix_t<B>* = nullptr>
+  inline void chain_internal(Result&& res, WMat&& w_mat, B&& b) {
+    w_mat.adj() += res.adj() * b.val().transpose();
+    b.adj() += w_mat.val().transpose() * res.adj();
   }
-}
 
-template <typename T1, typename T2, typename Res,
-          require_var_matrix_t<T1>* = nullptr>
-void update_w(T1& w, int m, int n, std::vector<int, arena_allocator<int>>& u,
-              std::vector<int, arena_allocator<int>>& v, T2&& b, Res&& res) {
-  Eigen::Map<Eigen::SparseMatrix<double, Eigen::RowMajor>> w_mat(
-      m, n, w.size(), u.data(), v.data(), w.adj().data());
-  for (int k = 0; k < w_mat.outerSize(); ++k) {
-    for (Eigen::Map<Eigen::SparseMatrix<double, Eigen::RowMajor>>::InnerIterator
-             it(w_mat, k);
-         it; ++it) {
-      it.valueRef() += res.adj().coeff(it.row()) * value_of(b).coeff(it.col());
-    }
+  /**
+   * Overload for calculating adjoints of `w_mat`
+   * @tparam Result Either a type inheriting from `Eigen::DenseBase` with scalar
+   * type `var` or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+   * @tparam WMat Either a type inheriting from `Eigen::DenseBase` with scalar
+   * type `var`. Or a `var<T>` where `T` inherits from `Eigen::SparseBase`
+   * @tparam B Either a type inheriting from `Eigen::DenseBase` with scalar type
+   * `double`
+   * @param res The vector result of the forward pass calculation
+   * @param w_mat A sparse matrix
+   * @param b A vector
+   */
+  template <typename Result, typename WMat, typename B,
+            require_rev_matrix_t<WMat>* = nullptr,
+            require_not_rev_matrix_t<B>* = nullptr>
+  inline void chain_internal(Result&& res, WMat&& w_mat, B&& b) {
+    w_mat.adj() += res.adj() * b.transpose();
   }
-}
 
+  /**
+   * Overload for calculating adjoints of `b`
+   * @tparam Result Either a type inheriting from `Eigen::DenseBase` with scalar
+   * type `var` or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+   * @tparam WMat Either a type inheriting from `Eigen::DenseBase` with scalar
+   * type `double`
+   * @tparam B Either a type inheriting from `Eigen::DenseBase` with scalar type
+   * `var` or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+   * @param res The vector result of the forward pass calculation
+   * @param w_mat A sparse matrix
+   * @param b A vector
+   */
+  template <typename Result, typename WMat, typename B,
+            require_not_rev_matrix_t<WMat>* = nullptr,
+            require_rev_matrix_t<B>* = nullptr>
+  inline void chain_internal(Result&& res, WMat&& w_mat, B&& b) {
+    b.adj() += w_mat.transpose() * res.adj();
+  }
+};
+
+/**
+ * Helper function to construct the csr_adjoint struct.
+ * @tparam Result_ Either a type inheriting from `Eigen::DenseBase` with scalar
+ * type `var` or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+ * @tparam WMat_ Either a type inheriting from `Eigen::DenseBase` with scalar
+ * type `var` or `double`. Or a `var<T>` where `T` inherits from
+ * `Eigen::SparseBase`
+ * @tparam B_ Either a type inheriting from `Eigen::DenseBase` with scalar type
+ * `var` or `double`. Or a `var<T>` where `T` inherits from `Eigen::DenseBase`
+ *
+ * @param res The vector result of the forward pass calculation
+ * @param w_mat A sparse matrix
+ * @param b A vector
+ */
+template <typename Result_, typename WMat_, typename B_>
+inline void make_csr_adjoint(Result_&& res, WMat_&& w_mat, B_&& b) {
+  new csr_adjoint<std::decay_t<Result_>, std::decay_t<WMat_>, std::decay_t<B_>>(
+      std::forward<Result_>(res), std::forward<WMat_>(w_mat),
+      std::forward<B_>(b));
+  return;
+}
 }  // namespace internal
 
 /**
@@ -100,46 +180,29 @@ inline auto csr_matrix_times_vector(int m, int n, const T1& w,
   std::vector<int, arena_allocator<int>> u_arena(u.size());
   std::transform(u.begin(), u.end(), u_arena.begin(),
                  [](auto&& x) { return x - 1; });
+  using sparse_var_value_t
+      = var_value<Eigen::SparseMatrix<double, Eigen::RowMajor>>;
   if (!is_constant<T2>::value && !is_constant<T1>::value) {
     arena_t<promote_scalar_t<var, T2>> b_arena = b;
-    arena_t<promote_scalar_t<var, T1>> w_arena = to_arena(w);
-    auto w_val_arena = to_arena(value_of(w_arena));
-    sparse_val_mat w_val_mat(m, n, w_val_arena.size(), u_arena.data(),
-                             v_arena.data(), w_val_arena.data());
-    arena_t<return_t> res = w_val_mat * value_of(b_arena);
-    reverse_pass_callback(
-        [m, n, w_arena, w_val_arena, v_arena, u_arena, res, b_arena]() mutable {
-          sparse_val_mat w_val_mat(m, n, w_val_arena.size(), u_arena.data(),
-                                   v_arena.data(), w_val_arena.data());
-          internal::update_w(w_arena, m, n, u_arena, v_arena, b_arena, res);
-          b_arena.adj() += w_val_mat.transpose() * res.adj();
-        });
+    sparse_var_value_t w_mat_arena
+        = to_soa_sparse_matrix<Eigen::RowMajor>(m, n, w, u_arena, v_arena);
+    arena_t<return_t> res = w_mat_arena.val() * value_of(b_arena);
+    stan::math::internal::make_csr_adjoint(res, w_mat_arena, b_arena);
     return return_t(res);
   } else if (!is_constant<T2>::value) {
     arena_t<promote_scalar_t<var, T2>> b_arena = b;
     auto w_val_arena = to_arena(value_of(w));
     sparse_val_mat w_val_mat(m, n, w_val_arena.size(), u_arena.data(),
                              v_arena.data(), w_val_arena.data());
-
     arena_t<return_t> res = w_val_mat * value_of(b_arena);
-    reverse_pass_callback(
-        [m, n, w_val_arena, v_arena, u_arena, res, b_arena]() mutable {
-          sparse_val_mat w_val_mat(m, n, w_val_arena.size(), u_arena.data(),
-                                   v_arena.data(), w_val_arena.data());
-          b_arena.adj() += w_val_mat.transpose() * res.adj();
-        });
+    stan::math::internal::make_csr_adjoint(res, w_val_mat, b_arena);
     return return_t(res);
   } else {
-    arena_t<promote_scalar_t<var, T1>> w_arena = to_arena(w);
-    auto&& w_val = eval(value_of(w_arena));
-    sparse_val_mat w_val_mat(m, n, w_val.size(), u_arena.data(), v_arena.data(),
-                             w_val.data());
+    sparse_var_value_t w_mat_arena
+        = to_soa_sparse_matrix<Eigen::RowMajor>(m, n, w, u_arena, v_arena);
     auto b_arena = to_arena(value_of(b));
-    arena_t<return_t> res = w_val_mat * b_arena;
-    reverse_pass_callback(
-        [m, n, w_arena, v_arena, u_arena, res, b_arena]() mutable {
-          internal::update_w(w_arena, m, n, u_arena, v_arena, b_arena, res);
-        });
+    arena_t<return_t> res = w_mat_arena.val() * b_arena;
+    stan::math::internal::make_csr_adjoint(res, w_mat_arena, b_arena);
     return return_t(res);
   }
 }
diff --git a/stan/math/rev/fun/fill.hpp b/stan/math/rev/fun/fill.hpp
index 2445c354537..703a2c657b6 100644
--- a/stan/math/rev/fun/fill.hpp
+++ b/stan/math/rev/fun/fill.hpp
@@ -23,7 +23,7 @@ namespace math {
 template <typename VarMat, typename S, require_var_matrix_t<VarMat>* = nullptr,
           require_var_t<S>* = nullptr>
 inline void fill(VarMat& x, const S& y) {
-  arena_t<plain_type_t<value_type_t<VarMat>>> prev_vals = x.val().eval();
+  arena_t<plain_type_t<value_type_t<VarMat>>> prev_vals(x.val().eval());
   x.vi_->val_.fill(y.val());
   reverse_pass_callback([x, y, prev_vals]() mutable {
     x.vi_->val_ = prev_vals;
@@ -46,7 +46,7 @@ inline void fill(VarMat& x, const S& y) {
 template <typename VarMat, typename S, require_var_matrix_t<VarMat>* = nullptr,
           require_arithmetic_t<S>* = nullptr>
 inline void fill(VarMat& x, const S& y) {
-  arena_t<plain_type_t<value_type_t<VarMat>>> prev_vals = x.val().eval();
+  arena_t<plain_type_t<value_type_t<VarMat>>> prev_vals(x.val().eval());
   x.vi_->val_.fill(y);
   reverse_pass_callback([x, prev_vals]() mutable {
     x.vi_->val_ = prev_vals;
diff --git a/stan/math/rev/fun/multiply.hpp b/stan/math/rev/fun/multiply.hpp
index 6851952a721..a2c1348896a 100644
--- a/stan/math/rev/fun/multiply.hpp
+++ b/stan/math/rev/fun/multiply.hpp
@@ -26,11 +26,11 @@ namespace math {
 template <typename T1, typename T2, require_all_matrix_t<T1, T2>* = nullptr,
           require_return_type_t<is_var, T1, T2>* = nullptr,
           require_not_row_and_col_vector_t<T1, T2>* = nullptr>
-inline auto multiply(const T1& A, const T2& B) {
+inline auto multiply(T1&& A, T2&& B) {
   check_multiplicable("multiply", "A", A, "B", B);
   if (!is_constant<T2>::value && !is_constant<T1>::value) {
-    arena_t<promote_scalar_t<var, T1>> arena_A = A;
-    arena_t<promote_scalar_t<var, T2>> arena_B = B;
+    arena_t<promote_scalar_t<var, T1>> arena_A(std::forward<T1>(A));
+    arena_t<promote_scalar_t<var, T2>> arena_B(std::forward<T2>(B));
     auto arena_A_val = to_arena(arena_A.val());
     auto arena_B_val = to_arena(arena_B.val());
     using return_t
@@ -48,19 +48,19 @@ inline auto multiply(const T1& A, const T2& B) {
             arena_B.adj() += arena_A_val.transpose() * res_adj;
           }
         });
-    return return_t(res);
+    return res;
   } else if (!is_constant<T2>::value) {
     arena_t<promote_scalar_t<double, T1>> arena_A = value_of(A);
-    arena_t<promote_scalar_t<var, T2>> arena_B = B;
+    arena_t<promote_scalar_t<var, T2>> arena_B(std::forward<T2>(B));
     using return_t
         = return_var_matrix_t<decltype(arena_A * value_of(B).eval()), T1, T2>;
     arena_t<return_t> res = arena_A * arena_B.val_op();
     reverse_pass_callback([arena_B, arena_A, res]() mutable {
       arena_B.adj() += arena_A.transpose() * res.adj_op();
     });
-    return return_t(res);
+    return res;
   } else {
-    arena_t<promote_scalar_t<var, T1>> arena_A = A;
+    arena_t<promote_scalar_t<var, T1>> arena_A(std::forward<T1>(A));
     arena_t<promote_scalar_t<double, T2>> arena_B = value_of(B);
     using return_t
         = return_var_matrix_t<decltype(value_of(arena_A).eval() * arena_B), T1,
@@ -70,7 +70,7 @@ inline auto multiply(const T1& A, const T2& B) {
       arena_A.adj() += res.adj_op() * arena_B.transpose();
     });
 
-    return return_t(res);
+    return res;
   }
 }
 
@@ -129,7 +129,7 @@ inline var multiply(const T1& A, const T2& B) {
  * @tparam T1 type of the scalar
  * @tparam T2 type of the matrix or expression
  *
- * @param A scalar
+ * @param a scalar
  * @param B matrix
  * @return product of matrix and scalar
  */
@@ -137,41 +137,41 @@ template <typename T1, typename T2, require_not_matrix_t<T1>* = nullptr,
           require_matrix_t<T2>* = nullptr,
           require_return_type_t<is_var, T1, T2>* = nullptr,
           require_not_row_and_col_vector_t<T1, T2>* = nullptr>
-inline auto multiply(const T1& A, const T2& B) {
+inline auto multiply(const T1& a, T2&& B) {
   if (!is_constant<T2>::value && !is_constant<T1>::value) {
-    arena_t<promote_scalar_t<var, T1>> arena_A = A;
-    arena_t<promote_scalar_t<var, T2>> arena_B = B;
+    arena_t<promote_scalar_t<var, T2>> arena_B(std::forward<T2>(B));
     using return_t = return_var_matrix_t<T2, T1, T2>;
-    arena_t<return_t> res = arena_A.val() * arena_B.val().array();
-    reverse_pass_callback([arena_A, arena_B, res]() mutable {
-      const auto a_val = arena_A.val();
+    var av = a;
+    auto a_val = value_of(av);
+    arena_t<return_t> res = a_val * arena_B.val().array();
+    reverse_pass_callback([av, a_val, arena_B, res]() mutable {
       for (Eigen::Index j = 0; j < res.cols(); ++j) {
         for (Eigen::Index i = 0; i < res.rows(); ++i) {
           const auto res_adj = res.adj().coeffRef(i, j);
-          arena_A.adj() += res_adj * arena_B.val().coeff(i, j);
+          av.adj() += res_adj * arena_B.val().coeff(i, j);
           arena_B.adj().coeffRef(i, j) += a_val * res_adj;
         }
       }
     });
-    return return_t(res);
+    return res;
   } else if (!is_constant<T2>::value) {
-    arena_t<promote_scalar_t<double, T1>> arena_A = value_of(A);
-    arena_t<promote_scalar_t<var, T2>> arena_B = B;
+    double val_a = value_of(a);
+    arena_t<promote_scalar_t<var, T2>> arena_B(std::forward<T2>(B));
     using return_t = return_var_matrix_t<T2, T1, T2>;
-    arena_t<return_t> res = arena_A * arena_B.val().array();
-    reverse_pass_callback([arena_A, arena_B, res]() mutable {
-      arena_B.adj().array() += arena_A * res.adj().array();
+    arena_t<return_t> res = val_a * arena_B.val().array();
+    reverse_pass_callback([val_a, arena_B, res]() mutable {
+      arena_B.adj().array() += val_a * res.adj().array();
     });
-    return return_t(res);
+    return res;
   } else {
-    arena_t<promote_scalar_t<var, T1>> arena_A = A;
+    var av = a;
     arena_t<promote_scalar_t<double, T2>> arena_B = value_of(B);
     using return_t = return_var_matrix_t<T2, T1, T2>;
-    arena_t<return_t> res = arena_A.val() * arena_B.array();
-    reverse_pass_callback([arena_A, arena_B, res]() mutable {
-      arena_A.adj() += (res.adj().array() * arena_B.array()).sum();
+    arena_t<return_t> res = av.val() * arena_B.array();
+    reverse_pass_callback([av, arena_B, res]() mutable {
+      av.adj() += (res.adj().array() * arena_B.array()).sum();
     });
-    return return_t(res);
+    return res;
   }
 }
 
@@ -192,8 +192,8 @@ template <typename T1, typename T2, require_matrix_t<T1>* = nullptr,
           require_not_complex_t<value_type_t<T1>>* = nullptr,
           require_not_complex_t<value_type_t<T2>>* = nullptr,
           require_not_row_and_col_vector_t<T1, T2>* = nullptr>
-inline auto multiply(const T1& A, const T2& B) {
-  return multiply(B, A);
+inline auto multiply(T1&& A, T2&& B) {
+  return multiply(std::forward<T2>(B), std::forward<T1>(A));
 }
 
 /**
@@ -207,8 +207,8 @@ inline auto multiply(const T1& A, const T2& B) {
  * @param b The right hand side of the multiplication
  */
 template <typename T1, typename T2, require_any_var_matrix_t<T1, T2>* = nullptr>
-inline auto operator*(const T1& a, const T2& b) {
-  return multiply(a, b);
+inline auto operator*(T1&& a, T2&& b) {
+  return multiply(std::forward<T1>(a), std::forward<T2>(b));
 }
 
 }  // namespace math
diff --git a/stan/math/rev/fun/sum.hpp b/stan/math/rev/fun/sum.hpp
index 832ce2c8719..9f4ba90ec5b 100644
--- a/stan/math/rev/fun/sum.hpp
+++ b/stan/math/rev/fun/sum.hpp
@@ -44,8 +44,8 @@ inline var sum(const std::vector<var, Alloc>& m) {
  * @return Sum of coefficients of matrix.
  */
 template <typename T, require_rev_matrix_t<T>* = nullptr>
-inline var sum(const T& x) {
-  arena_t<T> x_arena = x;
+inline var sum(T&& x) {
+  arena_t<T> x_arena(std::forward<T>(x));
   return make_callback_var(sum(x_arena.val()), [x_arena](auto& vi) mutable {
     x_arena.adj().array() += vi.adj();
   });
diff --git a/stan/math/rev/fun/to_soa_sparse_matrix.hpp b/stan/math/rev/fun/to_soa_sparse_matrix.hpp
new file mode 100644
index 00000000000..b5e872850a1
--- /dev/null
+++ b/stan/math/rev/fun/to_soa_sparse_matrix.hpp
@@ -0,0 +1,125 @@
+#ifndef STAN_MATH_REV_FUN_TO_SOA_SPARSE_MATRIX_HPP
+#define STAN_MATH_REV_FUN_TO_SOA_SPARSE_MATRIX_HPP
+
+#include <stan/math/prim/fun/Eigen.hpp>
+#include <stan/math/rev/core.hpp>
+#include <stan/math/rev/meta.hpp>
+#include <stan/math/prim/meta.hpp>
+#include <type_traits>
+
+namespace stan {
+namespace math {
+
+/**
+ * Create a sparse matrix from the given SoA matrix and indexes.
+ * @tparam Options Eigen matrix options.
+ * @tparam VarMatrix A @ref var_value with a dense vector inner type
+ * @tparam Vec1 Container type of the row start indexes (`u`).
+ * @tparam Vec2 Container type of the column indexes (`v`).
+ * @param m Number of rows in matrix.
+ * @param n Number of columns in matrix.
+ * @param w Vector of non-zero values in matrix.
+ * @param u Index of where each row starts in w, length equal to
+ *          the number of rows plus one.
+ * @param v Column index of each non-zero value, same
+ *          length as w.
+ * @return Sparse matrix.
+ */
+template <int Options = Eigen::ColMajor, typename VarMatrix, typename Vec1,
+          typename Vec2, require_var_t<VarMatrix>* = nullptr,
+          require_eigen_dense_base_t<value_type_t<VarMatrix>>* = nullptr,
+          require_all_std_vector_vt<std::is_integral, Vec1, Vec2>* = nullptr>
+inline auto to_soa_sparse_matrix(int m, int n, VarMatrix&& w, Vec1&& u,
+                                 Vec2&& v) {
+  auto u_arena = to_arena(std::forward<Vec1>(u));
+  auto v_arena = to_arena(std::forward<Vec2>(v));
+  using sparse_mat_t = Eigen::SparseMatrix<double, Options>;
+  using sparse_arena_mat_t = arena_t<sparse_mat_t>;
+  sparse_arena_mat_t arena_val_x(m, n, w.val().size(), u_arena.data(),
+                                 v_arena.data(), w.vi_->val_.data());
+  sparse_arena_mat_t arena_adj_x(m, n, w.adj().size(), u_arena.data(),
+                                 v_arena.data(), w.vi_->adj_.data());
+  var_value<sparse_mat_t> var_x(arena_val_x, arena_adj_x);
+  return var_x;
+}
+
+/**
+ * Create a sparse matrix from the given AoS matrix of vars and indexes.
+ * @tparam Options Eigen matrix options.
+ * @tparam MatrixVar A type inheriting from `Eigen::DenseBase` with a scalar
+ * type of @ref var_value
+ * @tparam Vec1 Container type of the row start indexes (`u`).
+ * @tparam Vec2 Container type of the column indexes (`v`).
+ * @param m Number of rows in matrix.
+ * @param n Number of columns in matrix.
+ * @param w Vector of non-zero values in matrix.
+ * @param u Index of where each row starts in w, length equal to
+ *          the number of rows plus one.
+ * @param v Column index of each non-zero value, same
+ *          length as w.
+ * @return Sparse matrix.
+ */
+template <int Options = Eigen::ColMajor, typename MatrixVar, typename Vec1,
+          typename Vec2,
+          require_eigen_dense_base_vt<is_var, MatrixVar>* = nullptr,
+          require_all_std_vector_vt<std::is_integral, Vec1, Vec2>* = nullptr>
+inline auto to_soa_sparse_matrix(int m, int n, MatrixVar&& w, Vec1&& u,
+                                 Vec2&& v) {
+  auto w_arena = to_arena(std::forward<MatrixVar>(w));
+  auto u_arena = to_arena(std::forward<Vec1>(u));
+  auto v_arena = to_arena(std::forward<Vec2>(v));
+  arena_t<Eigen::SparseMatrix<var, Options>> arena_x(
+      m, n, w_arena.size(), u_arena.data(), v_arena.data(), w_arena.data());
+  var_value<Eigen::SparseMatrix<double, Options>> var_x(value_of(arena_x));
+  // No need to copy adj, but need to backprop
+  reverse_pass_callback([arena_x, var_x]() mutable {
+    using var_sparse_iterator_t =
+        typename arena_t<Eigen::SparseMatrix<var, Options>>::InnerIterator;
+    using dbl_sparse_iterator_t =
+        typename arena_t<Eigen::SparseMatrix<double, Options>>::InnerIterator;
+    // TODO: `arena_x.adj() += var_x.adj()` once var sparse matrix has adj()
+    for (int k = 0; k < arena_x.outerSize(); ++k) {
+      var_sparse_iterator_t it_arena_x(arena_x, k);
+      dbl_sparse_iterator_t it_var_x(var_x.adj(), k);
+      for (; static_cast<bool>(it_arena_x) && static_cast<bool>(it_var_x);
+           ++it_arena_x, ++it_var_x) {
+        it_arena_x.valueRef().adj() += it_var_x.valueRef();
+      }
+    }
+  });
+  return var_x;
+}
+
+/**
+ * Create a sparse matrix from the given matrix of floats and indexes.
+ * @tparam Options Eigen matrix options.
+ * @tparam Mat A type inheriting from `Eigen::DenseBase` with an arithmetic
+ * scalar type
+ * @tparam Vec1 Container type of the row start indexes (`u`).
+ * @tparam Vec2 Container type of the column indexes (`v`).
+ * @param m Number of rows in matrix.
+ * @param n Number of columns in matrix.
+ * @param w Vector of non-zero values in matrix.
+ * @param u Index of where each row starts in w, length equal to
+ *          the number of rows plus one.
+ * @param v Column index of each non-zero value, same
+ *          length as w.
+ * @return Sparse matrix.
+ */
+template <int Options = Eigen::ColMajor, typename Mat, typename Vec1,
+          typename Vec2,
+          require_eigen_dense_base_vt<std::is_arithmetic, Mat>* = nullptr,
+          require_all_std_vector_vt<std::is_integral, Vec1, Vec2>* = nullptr>
+inline auto to_soa_sparse_matrix(int m, int n, Mat&& w, Vec1&& u, Vec2&& v) {
+  auto w_arena = to_arena(std::forward<Mat>(w));
+  auto u_arena = to_arena(std::forward<Vec1>(u));
+  auto v_arena = to_arena(std::forward<Vec2>(v));
+  arena_t<Eigen::SparseMatrix<double, Options>> arena_x(
+      m, n, w_arena.size(), u_arena.data(), v_arena.data(), w_arena.data());
+  return var_value<Eigen::SparseMatrix<double, Options>>(arena_x);
+}
+
+}  // namespace math
+}  // namespace stan
+
+#endif
diff --git a/stan/math/rev/fun/to_var_value.hpp b/stan/math/rev/fun/to_var_value.hpp
index 004b520b6f2..4b93cf1e6e6 100644
--- a/stan/math/rev/fun/to_var_value.hpp
+++ b/stan/math/rev/fun/to_var_value.hpp
@@ -18,7 +18,8 @@ namespace math {
  * @param a matrix to convert
  */
 template <typename T, require_eigen_vt<is_var, T>* = nullptr>
-var_value<Eigen::Matrix<double, T::RowsAtCompileTime, T::ColsAtCompileTime>>
+inline var_value<
+    Eigen::Matrix<double, T::RowsAtCompileTime, T::ColsAtCompileTime>>
 to_var_value(const T& a) {
   arena_matrix<plain_type_t<T>> a_arena = a;
   var_value<promote_scalar_t<double, T>> res(a_arena.val());
@@ -34,7 +35,7 @@ to_var_value(const T& a) {
  * @param a matrix to convert
  */
 template <typename T, require_var_t<T>* = nullptr>
-T to_var_value(T&& a) {
+inline T to_var_value(T&& a) {
   return std::forward<T>(a);
 }
 
@@ -46,7 +47,7 @@ T to_var_value(T&& a) {
  * @param a std::vector of elements to convert
  */
 template <typename T>
-auto to_var_value(const std::vector<T>& a) {
+inline auto to_var_value(const std::vector<T>& a) {
   std::vector<decltype(to_var_value(std::declval<T>()))> out;
   out.reserve(a.size());
   for (size_t i = 0; i < a.size(); ++i) {
diff --git a/test/unit/math/mix/fun/csr_matrix_times_vector_test.cpp b/test/unit/math/mix/fun/csr_matrix_times_vector_test.cpp
index 20c73955243..d17d1860fc3 100644
--- a/test/unit/math/mix/fun/csr_matrix_times_vector_test.cpp
+++ b/test/unit/math/mix/fun/csr_matrix_times_vector_test.cpp
@@ -1,7 +1,27 @@
 #include <test/unit/math/test_ad.hpp>
 #include <vector>
 
-TEST(MathMixMatFun, csr_matrix_times_vector) {
+TEST(MathMixMatFun, csr_matrix_times_vector_vals) {  // var vs double results
+  using stan::math::csr_matrix_times_vector;
+  std::vector<int> v{1, 2, 3, 1, 2};  // presumably column indexes (1-based)
+  std::vector<int> u{1, 2, 3, 4, 5, 6};  // presumably row starts, 5 + 1 long
+  Eigen::VectorXd b(5);
+  b << 1, 2, 3, 4, 5;
+  Eigen::VectorXd w(5);
+  w << -0.67082, 0.5, -0.223607, -0.223607, -0.5;
+  auto dbl_res = csr_matrix_times_vector(5, 5, w, v, u, b);  // all-double run
+  using stan::math::var;
+  Eigen::Matrix<var, -1, 1> b_var(b);
+  Eigen::Matrix<var, -1, 1> w_var(w);
+  auto var_res_w = csr_matrix_times_vector(5, 5, w_var, v, u, b);  // var w
+  EXPECT_MATRIX_EQ(dbl_res, var_res_w);
+  auto var_res_b = csr_matrix_times_vector(5, 5, w, v, u, b_var);  // var b
+  EXPECT_MATRIX_EQ(dbl_res, var_res_b);
+  auto var_res_bw = csr_matrix_times_vector(5, 5, w_var, v, u, b_var);  // both
+  EXPECT_MATRIX_EQ(dbl_res, var_res_bw);
+}
+
+TEST(MathMixMatFun, csr_matrix_times_vector1) {
   auto f = [](const auto& w, const auto& b) {
     using stan::math::csr_matrix_times_vector;
     std::vector<int> v{1, 2, 3, 1, 2};
@@ -15,5 +35,20 @@ TEST(MathMixMatFun, csr_matrix_times_vector) {
   b << 1, 2, 3, 4, 5;
 
   stan::test::expect_ad(f, w, b);
+}
+
+TEST(MathMixMatFun, csr_matrix_times_vector2) {  // expect_ad_matvar variant
+  auto f = [](const auto& w, const auto& b) {  // v and u are fixed inside
+    using stan::math::csr_matrix_times_vector;
+    std::vector<int> v{1, 2, 3, 1, 2};
+    std::vector<int> u{1, 2, 3, 4, 5, 6};
+    return csr_matrix_times_vector(5, 5, w, v, u, b);
+  };
+
+  Eigen::VectorXd w(5);  // values passed as the w argument of f
+  w << -0.67082, 0.5, -0.223607, -0.223607, -0.5;
+  Eigen::VectorXd b(5);  // vector passed as the b argument of f
+  b << 1, 2, 3, 4, 5;
+
   stan::test::expect_ad_matvar(f, w, b);
 }
diff --git a/test/unit/math/mix/functor/reduce_sum_part1_test.cpp b/test/unit/math/mix/functor/reduce_sum_part1_test.cpp
index abf7bc184f3..ad219f26182 100644
--- a/test/unit/math/mix/functor/reduce_sum_part1_test.cpp
+++ b/test/unit/math/mix/functor/reduce_sum_part1_test.cpp
@@ -1,14 +1,14 @@
 #include <stan/math/prim/meta.hpp>
 #include <test/unit/math/test_ad.hpp>
 #include <test/unit/math/mix/functor/reduce_sum_util.hpp>
-
+#include <test/unit/math/rev/util.hpp>
 #include <limits>
 #include <vector>
 
 // Reduce sum tests are broken up into four files to avoid windows compiler
 // error
 
-TEST(MathMix_reduce_sum, grainsize_static) {
+TEST_F(AgradRev, reduce_sum_grainsize_static) {
   using stan::math::test::get_new_msg;
   using stan::math::test::sum_lpdf;
 
@@ -33,7 +33,7 @@ TEST(MathMix_reduce_sum, grainsize_static) {
   stan::test::expect_ad(f4, data);
 }
 
-TEST(MathMix_reduce_sum, grainsize) {
+TEST_F(AgradRev, reduce_sum_grainsize) {
   using stan::math::test::get_new_msg;
   using stan::math::test::sum_lpdf;
   auto f1 = [](auto&& data) {
@@ -57,7 +57,7 @@ TEST(MathMix_reduce_sum, grainsize) {
   stan::test::expect_ad(f4, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_zero_length) {
+TEST_F(AgradRev, reduce_sum_std_vector_zero_length) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -67,7 +67,7 @@ TEST(MathMix_reduce_sum, std_vector_zero_length) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -77,7 +77,7 @@ TEST(MathMix_reduce_sum, std_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_std_vector_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_std_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -87,7 +87,7 @@ TEST(MathMix_reduce_sum, std_vector_std_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_eigen_vector_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_eigen_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -97,7 +97,7 @@ TEST(MathMix_reduce_sum, std_vector_eigen_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_eigen_row_vector_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_eigen_row_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -107,7 +107,7 @@ TEST(MathMix_reduce_sum, std_vector_eigen_row_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_eigen_matrix_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_eigen_matrix_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -117,7 +117,7 @@ TEST(MathMix_reduce_sum, std_vector_eigen_matrix_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_std_vector_std_vector_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_std_vector_std_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -128,7 +128,7 @@ TEST(MathMix_reduce_sum, std_vector_std_vector_std_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_std_vector_eigen_vector_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_std_vector_eigen_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -139,7 +139,8 @@ TEST(MathMix_reduce_sum, std_vector_std_vector_eigen_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_std_vector_eigen_row_vector_double_slice) {
+TEST_F(AgradRev,
+       reduce_sum_std_vector_std_vector_eigen_row_vector_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -150,7 +151,7 @@ TEST(MathMix_reduce_sum, std_vector_std_vector_eigen_row_vector_double_slice) {
   stan::test::expect_ad(reduce_sum_sum_lpdf, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_std_vector_eigen_matrix_double_slice) {
+TEST_F(AgradRev, reduce_sum_std_vector_std_vector_eigen_matrix_double_slice) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
 
@@ -180,7 +181,7 @@ TEST(StanMath_reduce_sum_static, start_end_slice) {
   stan::test::expect_ad(start_end_static, data);
 }
 
-TEST(MathMix_reduce_sum, int_arg) {
+TEST_F(AgradRev, reduce_sum_int_arg) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
   std::vector<double> data(2, 1.0);
@@ -192,7 +193,7 @@ TEST(MathMix_reduce_sum, int_arg) {
       [&](auto&& data) { return reduce_sum_sum_lpdf(data, arg); }, data);
 }
 
-TEST(MathMix_reduce_sum, std_vector_int_arg) {
+TEST_F(AgradRev, reduce_sum_std_vector_int_arg) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
   std::vector<double> data(2, 10.0);
@@ -204,12 +205,12 @@ TEST(MathMix_reduce_sum, std_vector_int_arg) {
       [&](auto&& data) { return reduce_sum_sum_lpdf(data, arg); }, data);
 }
 
-TEST(MathMix_reduce_sum, double_arg) {
+TEST_F(AgradRev, reduce_sum_double_arg) {
   stan::math::test::expect_ad_reduce_sum_lpdf(std::vector<double>(2, 10.0),
                                               5.0);
 }
 
-TEST(MathMix_reduce_sum, std_vector_double_arg) {
+TEST_F(AgradRev, reduce_sum_std_vector_double_arg) {
   stan::math::test::expect_ad_reduce_sum_lpdf(std::vector<double>(2, 10.0),
                                               std::vector<double>(2, 10.0));
 }
diff --git a/test/unit/math/mix/functor/reduce_sum_part2_test.cpp b/test/unit/math/mix/functor/reduce_sum_part2_test.cpp
index 524671b3223..16a9c7b4b2d 100644
--- a/test/unit/math/mix/functor/reduce_sum_part2_test.cpp
+++ b/test/unit/math/mix/functor/reduce_sum_part2_test.cpp
@@ -1,6 +1,7 @@
 #include <stan/math/prim/meta.hpp>
 #include <test/unit/math/test_ad.hpp>
 #include <test/unit/math/mix/functor/reduce_sum_util.hpp>
+#include <test/unit/math/rev/util.hpp>
 
 #include <limits>
 #include <vector>
@@ -8,41 +9,41 @@
 // Reduce sum tests are broken up into four files to avoid windows compiler
 // error
 
-TEST(MathMix_reduce_sum, eigen_vector_arg) {
+TEST_F(AgradRev, reduce_sum_eigen_vector_arg) {
   std::vector<double> data(2, 10.0);
   Eigen::VectorXd arg = Eigen::VectorXd::Ones(2);
   stan::math::test::expect_ad_reduce_sum_lpdf(data, arg);
 }
 
-TEST(MathMix_reduce_sum, eigen_row_vector_arg) {
+TEST_F(AgradRev, reduce_sum_eigen_row_vector_arg) {
   std::vector<double> data(2, 10.0);
   Eigen::RowVectorXd arg = Eigen::RowVectorXd::Ones(2);
 
   stan::math::test::expect_ad_reduce_sum_lpdf(data, arg);
 }
 
-TEST(MathMix_reduce_sum, eigen_matrix_arg) {
+TEST_F(AgradRev, reduce_sum_eigen_matrix_arg) {
   std::vector<double> data(2, 10.0);
   Eigen::MatrixXd arg = Eigen::MatrixXd::Ones(2, 2);
 
   stan::math::test::expect_ad_reduce_sum_lpdf(data, arg);
 }
 
-TEST(MathMix_reduce_sum, std_vector_std_vector_double_arg) {
+TEST_F(AgradRev, reduce_sum_std_vector_std_vector_double_arg) {
   std::vector<double> data(2, 10.0);
   std::vector<std::vector<double>> arg(2, std::vector<double>(2, 10.0));
 
   stan::math::test::expect_ad_reduce_sum_lpdf(data, arg);
 }
 
-TEST(MathMix_reduce_sum, std_vector_eigen_vector_arg) {
+TEST_F(AgradRev, reduce_sum_std_vector_eigen_vector_arg) {
   std::vector<double> data(2, 10.0);
   std::vector<Eigen::VectorXd> arg(2, Eigen::VectorXd::Ones(2));
 
   stan::math::test::expect_ad_reduce_sum_lpdf(data, arg);
 }
 
-TEST(MathMix_reduce_sum, std_vector_eigen_row_vector_arg) {
+TEST_F(AgradRev, reduce_sum_std_vector_eigen_row_vector_arg) {
   std::vector<double> data(2, 10.0);
   std::vector<Eigen::RowVectorXd> arg(2, Eigen::RowVectorXd::Ones(2));
 
diff --git a/test/unit/math/mix/functor/reduce_sum_part3_test.cpp b/test/unit/math/mix/functor/reduce_sum_part3_test.cpp
index 52723cdeee3..1999ce0d871 100644
--- a/test/unit/math/mix/functor/reduce_sum_part3_test.cpp
+++ b/test/unit/math/mix/functor/reduce_sum_part3_test.cpp
@@ -1,6 +1,7 @@
 #include <stan/math/prim/meta.hpp>
 #include <test/unit/math/test_ad.hpp>
 #include <test/unit/math/mix/functor/reduce_sum_util.hpp>
+#include <test/unit/math/rev/util.hpp>
 
 #include <limits>
 #include <vector>
@@ -8,7 +9,7 @@
 // Reduce sum tests are broken up into four files to avoid windows compiler
 // error
 
-TEST(MathMix_reduce_sum, eigen_three_args1) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args1) {
   using stan::math::test::reduce_sum_int_sum_lpdf;
   using stan::math::test::reduce_sum_static_int_sum_lpdf;
   Eigen::VectorXd arg1 = Eigen::VectorXd::Ones(2);
@@ -19,7 +20,7 @@ TEST(MathMix_reduce_sum, eigen_three_args1) {
   stan::test::expect_ad(reduce_sum_int_sum_lpdf, arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args2) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args2) {
   using stan::math::test::reduce_sum_int_sum_lpdf;
   using stan::math::test::reduce_sum_static_int_sum_lpdf;
   double arg1 = 1.0;
@@ -30,7 +31,7 @@ TEST(MathMix_reduce_sum, eigen_three_args2) {
   stan::test::expect_ad(reduce_sum_int_sum_lpdf, arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args3) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args3) {
   using stan::math::test::reduce_sum_int_sum_lpdf;
   using stan::math::test::reduce_sum_static_int_sum_lpdf;
   double arg1 = 1.0;
@@ -41,7 +42,7 @@ TEST(MathMix_reduce_sum, eigen_three_args3) {
   stan::test::expect_ad(reduce_sum_int_sum_lpdf, arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args_with_ints1) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args_with_ints1) {
   using stan::math::test::reduce_sum_int_sum_lpdf;
   using stan::math::test::reduce_sum_static_int_sum_lpdf;
   Eigen::VectorXd arg1 = Eigen::VectorXd::Ones(2);
@@ -63,7 +64,7 @@ TEST(MathMix_reduce_sum, eigen_three_args_with_ints1) {
       arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args_with_ints2) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args_with_ints2) {
   using stan::math::test::reduce_sum_int_sum_lpdf;
   using stan::math::test::reduce_sum_static_int_sum_lpdf;
   double arg1 = 1.0;
diff --git a/test/unit/math/mix/functor/reduce_sum_part4_test.cpp b/test/unit/math/mix/functor/reduce_sum_part4_test.cpp
index e2cfead9893..95d7ccf2fa7 100644
--- a/test/unit/math/mix/functor/reduce_sum_part4_test.cpp
+++ b/test/unit/math/mix/functor/reduce_sum_part4_test.cpp
@@ -1,6 +1,7 @@
 #include <stan/math/prim/meta.hpp>
 #include <test/unit/math/test_ad.hpp>
 #include <test/unit/math/mix/functor/reduce_sum_util.hpp>
+#include <test/unit/math/rev/util.hpp>
 
 #include <limits>
 #include <vector>
@@ -8,7 +9,7 @@
 // Reduce sum tests are broken up into four files to avoid windows compiler
 // error
 
-TEST(MathMix_reduce_sum, eigen_three_args_with_ints3) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args_with_ints3) {
   using stan::math::test::reduce_sum_int_sum_lpdf;
   using stan::math::test::reduce_sum_static_int_sum_lpdf;
   double arg1 = 1.0;
@@ -30,7 +31,7 @@ TEST(MathMix_reduce_sum, eigen_three_args_with_ints3) {
       arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args_with_doubles1) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args_with_doubles1) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
   Eigen::VectorXd arg1 = Eigen::VectorXd::Ones(2);
@@ -53,7 +54,7 @@ TEST(MathMix_reduce_sum, eigen_three_args_with_doubles1) {
       arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args_with_doubles2) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args_with_doubles2) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
   double arg1 = 1.0;
@@ -77,7 +78,7 @@ TEST(MathMix_reduce_sum, eigen_three_args_with_doubles2) {
       arg1, arg2, arg3);
 }
 
-TEST(MathMix_reduce_sum, eigen_three_args_with_doubles3) {
+TEST_F(AgradRev, reduce_sum_eigen_three_args_with_doubles3) {
   using stan::math::test::reduce_sum_static_sum_lpdf;
   using stan::math::test::reduce_sum_sum_lpdf;
   double arg1 = 1.0;
@@ -102,7 +103,7 @@ TEST(MathMix_reduce_sum, eigen_three_args_with_doubles3) {
 }
 
 #ifdef STAN_THREADS
-TEST(MathMix_reduce_sum, static_check) {
+TEST_F(AgradRev, reduce_sum_static_check) {
   using stan::math::test::get_new_msg;
   using stan::math::test::static_check_lpdf;
 
diff --git a/test/unit/math/mix/prob/bernoulli_logit_glm_lpmf_test.cpp b/test/unit/math/mix/prob/bernoulli_logit_glm_lpmf_test.cpp
index 430ff1a4769..fd29b24989e 100644
--- a/test/unit/math/mix/prob/bernoulli_logit_glm_lpmf_test.cpp
+++ b/test/unit/math/mix/prob/bernoulli_logit_glm_lpmf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, bernoulli_logit_glm_lpmf) {
+TEST_F(AgradRev, mathMixScalFun_bernoulli_logit_glm_lpmf) {
   auto f = [](const auto y) {
     return [=](const auto& x, const auto& alpha, const auto& beta) {
       return stan::math::bernoulli_logit_glm_lpmf(y, x, alpha, beta);
diff --git a/test/unit/math/mix/prob/categorical_logit_glm_lpmf_test.cpp b/test/unit/math/mix/prob/categorical_logit_glm_lpmf_test.cpp
index 084a92fc166..68de98a2cd8 100644
--- a/test/unit/math/mix/prob/categorical_logit_glm_lpmf_test.cpp
+++ b/test/unit/math/mix/prob/categorical_logit_glm_lpmf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, categorical_logit_glm_lpmf) {
+TEST_F(AgradRev, mathMixScalFun_categorical_logit_glm_lpmf) {
   auto f = [](const auto y) {
     return [=](const auto& x, const auto& alpha, const auto& beta) {
       return stan::math::categorical_logit_glm_lpmf(y, x, alpha, beta);
diff --git a/test/unit/math/mix/prob/categorical_logit_test.cpp b/test/unit/math/mix/prob/categorical_logit_test.cpp
index efd4e01efd3..f7b9217341b 100644
--- a/test/unit/math/mix/prob/categorical_logit_test.cpp
+++ b/test/unit/math/mix/prob/categorical_logit_test.cpp
@@ -1,9 +1,10 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <gtest/gtest.h>
 #include <limits>
 #include <vector>
 
-TEST(ProbDistributionsCategoricalLogit, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsCategoricalLogit_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -28,7 +29,7 @@ TEST(ProbDistributionsCategoricalLogit, fvar_var) {
                   stan::math::categorical_logit_lpmf(3, theta).d_.val());
 }
 
-TEST(ProbDistributionsCategoricalLogit, fvar_var_vectorized) {
+TEST_F(AgradRev, ProbDistributionsCategoricalLogit_fvar_var_vectorized) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -58,7 +59,7 @@ TEST(ProbDistributionsCategoricalLogit, fvar_var_vectorized) {
                   stan::math::categorical_logit_lpmf(ms, theta).d_.val());
 }
 
-TEST(ProbDistributionsCategoricalLogit, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsCategoricalLogit_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -83,7 +84,7 @@ TEST(ProbDistributionsCategoricalLogit, fvar_fvar_var) {
                   stan::math::categorical_logit_lpmf(3, theta).d_.val_.val());
 }
 
-TEST(ProbDistributionsCategoricalLogit, fvar_fvar_var_vectorized) {
+TEST_F(AgradRev, ProbDistributionsCategoricalLogit_fvar_fvar_var_vectorized) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/categorical_test.cpp b/test/unit/math/mix/prob/categorical_test.cpp
index 0e6024b5387..fa54fc94d75 100644
--- a/test/unit/math/mix/prob/categorical_test.cpp
+++ b/test/unit/math/mix/prob/categorical_test.cpp
@@ -1,10 +1,11 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <gtest/gtest.h>
 #include <boost/random/mersenne_twister.hpp>
 #include <boost/math/distributions.hpp>
 #include <vector>
 
-TEST(ProbDistributionsCategorical, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsCategorical_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -24,7 +25,7 @@ TEST(ProbDistributionsCategorical, fvar_var) {
   EXPECT_FLOAT_EQ(1.0 / 0.5, stan::math::categorical_lpmf(2, theta).d_.val());
   EXPECT_FLOAT_EQ(1.0 / 0.2, stan::math::categorical_lpmf(3, theta).d_.val());
 }
-TEST(ProbDistributionsCategorical, fvar_var_vector) {
+TEST_F(AgradRev, ProbDistributionsCategorical_fvar_var_vector) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -45,7 +46,7 @@ TEST(ProbDistributionsCategorical, fvar_var_vector) {
                   stan::math::categorical_lpmf(xs, theta).d_.val());
 }
 
-TEST(ProbDistributionsCategorical, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsCategorical_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -68,7 +69,7 @@ TEST(ProbDistributionsCategorical, fvar_fvar_var) {
   EXPECT_FLOAT_EQ(1.0 / 0.2,
                   stan::math::categorical_lpmf(3, theta).d_.val_.val());
 }
-TEST(ProbDistributionsCategorical, fvar_fvar_var_vector) {
+TEST_F(AgradRev, ProbDistributionsCategorical_fvar_fvar_var_vector) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/dirichlet_test.cpp b/test/unit/math/mix/prob/dirichlet_test.cpp
index cfddbddbaad..419dd83dccd 100644
--- a/test/unit/math/mix/prob/dirichlet_test.cpp
+++ b/test/unit/math/mix/prob/dirichlet_test.cpp
@@ -16,7 +16,7 @@ T vectorize_softmax(const T& y) {
 }
 }  // namespace dirichlet_test
 
-TEST(ProbDistributions, dirichlet) {
+TEST_F(AgradRev, ProbDistributions_dirichlet) {
   auto f = [](const auto& y, const auto& alpha) {
     auto y_simplex = dirichlet_test::vectorize_softmax(y);
     auto lp = stan::math::dirichlet_lpdf(y_simplex, alpha);
@@ -36,7 +36,7 @@ TEST(ProbDistributions, dirichlet) {
   stan::test::expect_ad(f, vs, vs);
 }
 
-TEST(ProbDistributions, fvar_var) {
+TEST_F(AgradRev, ProbDistributions_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -71,7 +71,7 @@ TEST(ProbDistributions, fvar_var) {
                   stan::math::dirichlet_lpdf(theta2, alpha2).d_.val());
 }
 
-TEST(ProbDistributions, fvar_varVectorized) {
+TEST_F(AgradRev, ProbDistributions_fvar_varVectorized) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::dirichlet_lpdf;
@@ -127,7 +127,7 @@ TEST(ProbDistributions, fvar_varVectorized) {
   EXPECT_FLOAT_EQ(result.d().val().sum(), out.d_.val());
 }
 
-TEST(ProbDistributions, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributions_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -162,7 +162,7 @@ TEST(ProbDistributions, fvar_fvar_var) {
                   stan::math::dirichlet_lpdf(theta2, alpha2).d_.val_.val());
 }
 
-TEST(ProbDistributions, fvar_fvar_varVectorized) {
+TEST_F(AgradRev, ProbDistributions_fvar_fvar_varVectorized) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::dirichlet_lpdf;
diff --git a/test/unit/math/mix/prob/gamma_cdf_log_test.cpp b/test/unit/math/mix/prob/gamma_cdf_log_test.cpp
index b2b60663610..185bc13c450 100644
--- a/test/unit/math/mix/prob/gamma_cdf_log_test.cpp
+++ b/test/unit/math/mix/prob/gamma_cdf_log_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, gamma_lcdf) {
+TEST_F(AgradRev, mathMixScalFun_gamma_lcdf) {
   auto f = [](const auto& y, const auto& alpha, const auto& beta) {
     return stan::math::gamma_lcdf(y, alpha, beta);
   };
diff --git a/test/unit/math/mix/prob/gaussian_dlm_obs_test.cpp b/test/unit/math/mix/prob/gaussian_dlm_obs_test.cpp
index 831c77235b4..93bb2cb57b5 100644
--- a/test/unit/math/mix/prob/gaussian_dlm_obs_test.cpp
+++ b/test/unit/math/mix/prob/gaussian_dlm_obs_test.cpp
@@ -1,7 +1,8 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <gtest/gtest.h>
 
-TEST(ProbDistributionsGaussianDLM, LoglikeUU_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsGaussianDLM_LoglikeUU_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using Eigen::MatrixXd;
@@ -34,7 +35,7 @@ TEST(ProbDistributionsGaussianDLM, LoglikeUU_fvar_var) {
   EXPECT_FLOAT_EQ(-3.8427677, lp_ref.d_.val());
 }
 
-TEST(ProbDistributionsGaussianDLM, LoglikeMM_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsGaussianDLM_LoglikeMM_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using Eigen::MatrixXd;
@@ -87,7 +88,7 @@ TEST(ProbDistributionsGaussianDLM, LoglikeMM_fvar_var) {
   EXPECT_NEAR(18.89044287309947, lp_ref.d_.val(), 1e-4);
 }
 
-TEST(ProbDistributionsGaussianDLM, LoglikeUU_fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsGaussianDLM_LoglikeUU_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using Eigen::MatrixXd;
@@ -125,7 +126,7 @@ TEST(ProbDistributionsGaussianDLM, LoglikeUU_fvar_fvar_var) {
   EXPECT_FLOAT_EQ(-3.8427677, lp_ref.d_.val_.val());
 }
 
-TEST(ProbDistributionsGaussianDLM, LoglikeMM_fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsGaussianDLM_LoglikeMM_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using Eigen::MatrixXd;
diff --git a/test/unit/math/mix/prob/inv_wishart_cholesky_test.cpp b/test/unit/math/mix/prob/inv_wishart_cholesky_test.cpp
index 04e82242194..6309310197a 100644
--- a/test/unit/math/mix/prob/inv_wishart_cholesky_test.cpp
+++ b/test/unit/math/mix/prob/inv_wishart_cholesky_test.cpp
@@ -1,6 +1,7 @@
 #include <test/unit/math/test_ad.hpp>
+#include <test/unit/math/rev/fun/util.hpp>
 
-TEST(ProbDistributionsInvWishartCholesky, matvar) {
+TEST_F(AgradRev, ProbDistributionsInvWishartCholesky_matvar) {
   auto f = [](const auto& Y, const auto& dof, const auto& Sigma) {
     auto symmetric_Y = ((Y + Y.transpose()) * 0.5).eval();
     auto symmetric_Sigma = ((Sigma + Sigma.transpose()) * 0.5).eval();
@@ -38,7 +39,7 @@ TEST(ProbDistributionsInvWishartCholesky, matvar) {
   stan::test::expect_ad_matvar(f, Y11, dof, Sigma00);
 }
 
-TEST(ProbDistributionsInvWishartCholesky, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsInvWishartCholesky_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -73,7 +74,7 @@ TEST(ProbDistributionsInvWishartCholesky, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsInvWishartCholesky, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsInvWishartCholesky_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/inv_wishart_test.cpp b/test/unit/math/mix/prob/inv_wishart_test.cpp
index 5f65fe23c27..c513b4a4cc0 100644
--- a/test/unit/math/mix/prob/inv_wishart_test.cpp
+++ b/test/unit/math/mix/prob/inv_wishart_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsInvWishart, matvar) {
+TEST_F(AgradRev, ProbDistributionsInvWishart_matvar) {
   auto f = [](const auto& y, const auto& dof, const auto& sigma) {
     auto y_sym = stan::math::multiply(0.5, y + y.transpose());
     auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
@@ -34,7 +34,7 @@ TEST(ProbDistributionsInvWishart, matvar) {
   stan::test::expect_ad_matvar(f, y11, dof, Sigma00);
 }
 
-TEST(ProbDistributionsInvWishart, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsInvWishart_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -66,7 +66,7 @@ TEST(ProbDistributionsInvWishart, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsInvWishart, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsInvWishart_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/lkj_corr_test.cpp b/test/unit/math/mix/prob/lkj_corr_test.cpp
index 6d93e009c58..bb96388ade9 100644
--- a/test/unit/math/mix/prob/lkj_corr_test.cpp
+++ b/test/unit/math/mix/prob/lkj_corr_test.cpp
@@ -1,4 +1,5 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <gtest/gtest.h>
 #include <test/unit/math/rev/prob/lkj_corr_cholesky_test_functors.hpp>
 #include <boost/random/mersenne_twister.hpp>
@@ -6,7 +7,7 @@
 #include <test/unit/math/mix/prob/higher_order_utils.hpp>
 #include <vector>
 
-TEST(ProbDistributionsLkjCorr, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsLkjCorr_fvar_var) {
   using stan::math::fvar;
   using stan::math::var;
   boost::random::mt19937 rng;
@@ -28,7 +29,7 @@ TEST(ProbDistributionsLkjCorr, fvar_var) {
   EXPECT_FLOAT_EQ(f.d_.val(), stan::math::lkj_corr_lpdf(Sigma, eta).d_.val());
 }
 
-TEST(ProbDistributionsLkjCorrCholesky, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsLkjCorrCholesky_fvar_var) {
   using stan::math::fvar;
   using stan::math::var;
   boost::random::mt19937 rng;
@@ -51,7 +52,7 @@ TEST(ProbDistributionsLkjCorrCholesky, fvar_var) {
   EXPECT_FLOAT_EQ(3, stan::math::lkj_corr_cholesky_lpdf(Sigma, eta).d_.val());
 }
 
-TEST(ProbDistributionsLkjCorr, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsLkjCorr_fvar_fvar_var) {
   using stan::math::fvar;
   using stan::math::var;
   boost::random::mt19937 rng;
@@ -75,7 +76,7 @@ TEST(ProbDistributionsLkjCorr, fvar_fvar_var) {
                   stan::math::lkj_corr_lpdf(Sigma, eta).d_.val_.val());
 }
 
-TEST(ProbDistributionsLkjCorrCholesky, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsLkjCorrCholesky_fvar_fvar_var) {
   using stan::math::fvar;
   using stan::math::var;
   boost::random::mt19937 rng;
@@ -101,7 +102,7 @@ TEST(ProbDistributionsLkjCorrCholesky, fvar_fvar_var) {
                   stan::math::lkj_corr_cholesky_lpdf(Sigma, eta).d_.val_.val());
 }
 
-TEST(ProbDistributionsLkjCorrCholesky, hessian) {
+TEST_F(AgradRev, ProbDistributionsLkjCorrCholesky_hessian) {
   int dim_mat = 3;
   Eigen::Matrix<double, Eigen::Dynamic, 1> x1(dim_mat);
   Eigen::Matrix<double, Eigen::Dynamic, 1> x2(1);
@@ -162,7 +163,7 @@ TEST(ProbDistributionsLkjCorrCholesky, hessian) {
   EXPECT_FLOAT_EQ(fx_hess_1, fx_hess_ad_1);
 }
 
-TEST(ProbDistributionsLkjCorrCholesky, grad_hessian) {
+TEST_F(AgradRev, ProbDistributionsLkjCorrCholesky_grad_hessian) {
   int dim_mat = 3;
   Eigen::Matrix<double, Eigen::Dynamic, 1> x1(dim_mat);
   Eigen::Matrix<double, Eigen::Dynamic, 1> x2(1);
diff --git a/test/unit/math/mix/prob/matrix_normal_prec_test.cpp b/test/unit/math/mix/prob/matrix_normal_prec_test.cpp
index ea9fd3c2a7f..500e840570a 100644
--- a/test/unit/math/mix/prob/matrix_normal_prec_test.cpp
+++ b/test/unit/math/mix/prob/matrix_normal_prec_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsMatrixNormal, matvar) {
+TEST_F(AgradRev, ProbDistributionsMatrixNormal_matvar) {
   auto f = [](const auto& y, const auto& mu, const auto& sigma, const auto& D) {
     auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
     auto D_sym = stan::math::multiply(0.5, D + D.transpose());
@@ -64,7 +64,7 @@ TEST(ProbDistributionsMatrixNormal, matvar) {
   stan::test::expect_ad_matvar(f, y1, mu1, Sigma00, D11);
 }
 
-TEST(ProbDistributionsMatrixNormal, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMatrixNormal_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -102,7 +102,7 @@ TEST(ProbDistributionsMatrixNormal, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsMatrixNormal, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMatrixNormal_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multi_gp_cholesky_test.cpp b/test/unit/math/mix/prob/multi_gp_cholesky_test.cpp
index ee6ac0a6ada..ef258a17497 100644
--- a/test/unit/math/mix/prob/multi_gp_cholesky_test.cpp
+++ b/test/unit/math/mix/prob/multi_gp_cholesky_test.cpp
@@ -1,7 +1,8 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <gtest/gtest.h>
 
-TEST(ProbDistributionsMultiGPCholesky, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiGPCholesky_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -48,7 +49,7 @@ TEST(ProbDistributionsMultiGPCholesky, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsMultiGPCholesky, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiGPCholesky_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multi_gp_test.cpp b/test/unit/math/mix/prob/multi_gp_test.cpp
index 91b3f7c2248..9a4652ea341 100644
--- a/test/unit/math/mix/prob/multi_gp_test.cpp
+++ b/test/unit/math/mix/prob/multi_gp_test.cpp
@@ -2,7 +2,7 @@
 #include <gtest/gtest.h>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsMultiGP, matvar) {
+TEST_F(AgradRev, ProbDistributionsMultiGP_matvar) {
   auto f = [](const auto& y, const auto& sigma, const auto& w) {
     auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
     return stan::math::multi_gp_lpdf(y, sigma_sym, w);
@@ -46,7 +46,7 @@ TEST(ProbDistributionsMultiGP, matvar) {
   stan::test::expect_ad(f, y22, Sigma00, w0);
 }
 
-TEST(ProbDistributionsMultiGP, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiGP_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -90,7 +90,7 @@ TEST(ProbDistributionsMultiGP, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsMultiGP, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiGP_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multi_normal_cholesky_test.cpp b/test/unit/math/mix/prob/multi_normal_cholesky_test.cpp
index f8aea19e3f6..65f1e17a3e7 100644
--- a/test/unit/math/mix/prob/multi_normal_cholesky_test.cpp
+++ b/test/unit/math/mix/prob/multi_normal_cholesky_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsMultiNormalCholesky, matvar) {
+TEST_F(AgradRev, ProbDistributionsMultiNormalCholesky_matvar) {
   auto f = [](const auto& y, const auto& mu, const auto& sigma) {
     auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
     auto L = stan::math::cholesky_decompose(sigma_sym);
@@ -45,7 +45,7 @@ TEST(ProbDistributionsMultiNormalCholesky, matvar) {
   stan::test::expect_ad_matvar(f, y1, mu1, Sigma00);
 }
 
-TEST(ProbDistributionsMultiNormalCholesky, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiNormalCholesky_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -73,7 +73,7 @@ TEST(ProbDistributionsMultiNormalCholesky, fvar_var) {
                   stan::math::multi_normal_cholesky_lpdf(y, mu, L).d_.val());
 }
 
-TEST(ProbDistributionsMultiNormalCholesky, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiNormalCholesky_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multi_normal_prec_test.cpp b/test/unit/math/mix/prob/multi_normal_prec_test.cpp
index 606c050af9e..5d8840db476 100644
--- a/test/unit/math/mix/prob/multi_normal_prec_test.cpp
+++ b/test/unit/math/mix/prob/multi_normal_prec_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsMultiNormalPrec, matvar) {
+TEST_F(AgradRev, ProbDistributionsMultiNormalPrec_matvar) {
   auto f = [](const auto& y, const auto& mu, const auto& sigma) {
     auto inv_sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
     return stan::math::multi_normal_prec_lpdf(y, mu, inv_sigma_sym);
@@ -37,7 +37,7 @@ TEST(ProbDistributionsMultiNormalPrec, matvar) {
   stan::test::expect_ad_matvar(f, y1, mu1, InvSigma00);
 }
 
-TEST(ProbDistributionsMultiNormalPrec, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiNormalPrec_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -67,7 +67,7 @@ TEST(ProbDistributionsMultiNormalPrec, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsMultiNormalPrec, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiNormalPrec_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multi_normal_test.cpp b/test/unit/math/mix/prob/multi_normal_test.cpp
index f5c9d507f48..7022ec9ff46 100644
--- a/test/unit/math/mix/prob/multi_normal_test.cpp
+++ b/test/unit/math/mix/prob/multi_normal_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsMultiNormal, matvar) {
+TEST_F(AgradRev, ProbDistributionsMultiNormal_matvar) {
   auto f = [](const auto& y, const auto& mu, const auto& sigma) {
     auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
     return stan::math::multi_normal_lpdf(y, mu, sigma_sym);
@@ -47,7 +47,7 @@ TEST(ProbDistributionsMultiNormal, matvar) {
   stan::test::expect_ad_matvar(f, y1, mu1, Sigma00);
 }
 
-TEST(ProbDistributionsMultiNormal, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiNormal_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -74,7 +74,7 @@ TEST(ProbDistributionsMultiNormal, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsMultiNormal, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiNormal_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multi_student_t_test.cpp b/test/unit/math/mix/prob/multi_student_t_test.cpp
index a74881fe6da..88b3d2b51d6 100644
--- a/test/unit/math/mix/prob/multi_student_t_test.cpp
+++ b/test/unit/math/mix/prob/multi_student_t_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsMultiStudentT, matvar) {
+TEST_F(AgradRev, ProbDistributionsMultiStudentT_matvar) {
   auto f
       = [](const auto& y, const auto& nu, const auto& mu, const auto& sigma) {
           auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
@@ -58,7 +58,7 @@ TEST(ProbDistributionsMultiStudentT, matvar) {
   stan::test::expect_ad_matvar(f, y1, nu, mu1, Sigma00);
 }
 
-TEST(ProbDistributionsMultiStudentT, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiStudentT_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -87,7 +87,7 @@ TEST(ProbDistributionsMultiStudentT, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsMultiStudentT, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultiStudentT_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/multinomial_logit_test.cpp b/test/unit/math/mix/prob/multinomial_logit_test.cpp
index de8a3e1296c..1c6e54767f4 100644
--- a/test/unit/math/mix/prob/multinomial_logit_test.cpp
+++ b/test/unit/math/mix/prob/multinomial_logit_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, multinomialLogit) {
+TEST_F(AgradRev, mathMixScalFun_multinomialLogit) {
   std::vector<int> ns{0, 1, 2, 3};
   Eigen::VectorXd beta(4);
   beta << 0.1, 0.1, 0.5, 0.3;
diff --git a/test/unit/math/mix/prob/multinomial_test.cpp b/test/unit/math/mix/prob/multinomial_test.cpp
index c8f706a7580..96f0bfbd59e 100644
--- a/test/unit/math/mix/prob/multinomial_test.cpp
+++ b/test/unit/math/mix/prob/multinomial_test.cpp
@@ -1,10 +1,11 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <gtest/gtest.h>
 #include <boost/random/mersenne_twister.hpp>
 #include <boost/math/distributions.hpp>
 #include <vector>
 
-TEST(ProbDistributionsMultinomial, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultinomial_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -23,7 +24,7 @@ TEST(ProbDistributionsMultinomial, fvar_var) {
   EXPECT_FLOAT_EQ(17.666666, stan::math::multinomial_lpmf(ns, theta).d_.val());
 }
 
-TEST(ProbDistributionsMultinomial, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsMultinomial_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/neg_binomial_2_log_glm_lpmf_test.cpp b/test/unit/math/mix/prob/neg_binomial_2_log_glm_lpmf_test.cpp
index 92d8e42754f..5934aaf04b2 100644
--- a/test/unit/math/mix/prob/neg_binomial_2_log_glm_lpmf_test.cpp
+++ b/test/unit/math/mix/prob/neg_binomial_2_log_glm_lpmf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, neg_binomial_2_log_glm_lpmf) {
+TEST_F(AgradRev, mathMixScalFun_neg_binomial_2_log_glm_lpmf) {
   auto f = [](const auto y, const auto& x) {
     return [=](const auto& alpha, const auto& beta, const auto& phi) {
       return stan::math::neg_binomial_2_log_glm_lpmf(y, x, alpha, beta, phi);
diff --git a/test/unit/math/mix/prob/neg_binomial_2_log_test.cpp b/test/unit/math/mix/prob/neg_binomial_2_log_test.cpp
index a04071c0ccb..2ef7f77b49d 100644
--- a/test/unit/math/mix/prob/neg_binomial_2_log_test.cpp
+++ b/test/unit/math/mix/prob/neg_binomial_2_log_test.cpp
@@ -3,7 +3,7 @@
 #include <gtest/gtest.h>
 #include <boost/math/differentiation/finite_difference.hpp>
 
-TEST(mathMixScalFun, neg_binomial_2_log_lpmf_derivatives) {
+TEST_F(AgradRev, mathMixScalFun_neg_binomial_2_log_lpmf_derivatives) {
   auto f1 = [](const auto& eta, const auto& phi) {
     return stan::math::neg_binomial_2_log_lpmf(0, eta, phi);
   };
diff --git a/test/unit/math/mix/prob/neg_binomial_test.cpp b/test/unit/math/mix/prob/neg_binomial_test.cpp
index a17998ded93..7d69ade8b1c 100644
--- a/test/unit/math/mix/prob/neg_binomial_test.cpp
+++ b/test/unit/math/mix/prob/neg_binomial_test.cpp
@@ -3,7 +3,7 @@
 #include <gtest/gtest.h>
 #include <boost/math/differentiation/finite_difference.hpp>
 
-TEST(mathMixScalFun, neg_binomial_lpmf_derivatives) {
+TEST_F(AgradRev, mathMixScalFun_neg_binomial_lpmf_derivatives) {
   auto f = [](const int y) {
     return [=](const auto& alpha, const auto& beta) {
       return stan::math::neg_binomial_lpmf(y, alpha, beta);
diff --git a/test/unit/math/mix/prob/normal_ccdf_log_test.cpp b/test/unit/math/mix/prob/normal_ccdf_log_test.cpp
index 7c0cfc41b0b..e573e7da289 100644
--- a/test/unit/math/mix/prob/normal_ccdf_log_test.cpp
+++ b/test/unit/math/mix/prob/normal_ccdf_log_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, normal_lccdf) {
+TEST_F(AgradRev, mathMixScalFun_normal_lccdf) {
   auto f = [](const double mu, const double sigma) {
     return
         [=](const auto& y) { return stan::math::normal_lccdf(y, mu, sigma); };
diff --git a/test/unit/math/mix/prob/normal_cdf_log_test.cpp b/test/unit/math/mix/prob/normal_cdf_log_test.cpp
index 38560deda7b..7a737c87c77 100644
--- a/test/unit/math/mix/prob/normal_cdf_log_test.cpp
+++ b/test/unit/math/mix/prob/normal_cdf_log_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, normal_lcdf) {
+TEST_F(AgradRev, mathMixScalFun_normal_lcdf) {
   auto f = [](const double mu, const double sigma) {
     return [=](const auto& y) { return stan::math::normal_lcdf(y, mu, sigma); };
   };
diff --git a/test/unit/math/mix/prob/normal_cdf_test.cpp b/test/unit/math/mix/prob/normal_cdf_test.cpp
index 80e85c3ac4f..a73594c447f 100644
--- a/test/unit/math/mix/prob/normal_cdf_test.cpp
+++ b/test/unit/math/mix/prob/normal_cdf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, normal_cdf) {
+TEST_F(AgradRev, mathMixScalFun_normal_cdf) {
   auto f = [](const double mu, const double sigma) {
     return [=](const auto& y) { return stan::math::normal_cdf(y, mu, sigma); };
   };
diff --git a/test/unit/math/mix/prob/normal_id_glm_lpdf_test.cpp b/test/unit/math/mix/prob/normal_id_glm_lpdf_test.cpp
index 3af9083a628..f38537c3c08 100644
--- a/test/unit/math/mix/prob/normal_id_glm_lpdf_test.cpp
+++ b/test/unit/math/mix/prob/normal_id_glm_lpdf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, normal_id_glm_lpdf) {
+TEST_F(AgradRev, mathMixScalFun_normal_id_glm_lpdf) {
   auto f = [](const auto& y, const auto& x) {
     return [=](const auto& alpha, const auto& beta, const auto& sigma) {
       return stan::math::normal_id_glm_lpdf(y, x, alpha, beta, sigma);
diff --git a/test/unit/math/mix/prob/normal_test.cpp b/test/unit/math/mix/prob/normal_test.cpp
index 81136b202d2..029c9ada73d 100644
--- a/test/unit/math/mix/prob/normal_test.cpp
+++ b/test/unit/math/mix/prob/normal_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, normal_lpdf) {
+TEST_F(AgradRev, mathMixScalFun_normal_lpdf) {
   auto f = [](const double mu, const double sigma) {
     return [=](const auto& y) { return stan::math::normal_lpdf(y, mu, sigma); };
   };
diff --git a/test/unit/math/mix/prob/ordered_logistic_glm_lpmf_test.cpp b/test/unit/math/mix/prob/ordered_logistic_glm_lpmf_test.cpp
index db0a34f9d92..b4791cdbed5 100644
--- a/test/unit/math/mix/prob/ordered_logistic_glm_lpmf_test.cpp
+++ b/test/unit/math/mix/prob/ordered_logistic_glm_lpmf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, ordered_logistic_glm_lpmf) {
+TEST_F(AgradRev, mathMixScalFun_ordered_logistic_glm_lpmf) {
   auto f = [](const auto y) {
     return [=](const auto& x, const auto& beta, const auto& cutpoints) {
       return stan::math::ordered_logistic_glm_lpmf(y, x, beta, cutpoints);
diff --git a/test/unit/math/mix/prob/ordered_logistic_test.cpp b/test/unit/math/mix/prob/ordered_logistic_test.cpp
index 8270e873c80..c749d754223 100644
--- a/test/unit/math/mix/prob/ordered_logistic_test.cpp
+++ b/test/unit/math/mix/prob/ordered_logistic_test.cpp
@@ -1,9 +1,10 @@
 #include <stan/math/mix.hpp>
+#include <test/unit/math/test_ad.hpp>
 #include <test/unit/math/rev/fun/util.hpp>
 #include <gtest/gtest.h>
 #include <vector>
 
-TEST(ProbDistributionsOrdLog, fv_fv) {
+TEST_F(AgradRev, ProbDistributionsOrdLog_fv_fv) {
   using stan::math::fvar;
   using stan::math::ordered_logistic_lpmf;
   using stan::math::var;
@@ -54,7 +55,7 @@ TEST(ProbDistributionsOrdLog, fv_fv) {
   EXPECT_FLOAT_EQ(c_ffv[2].d_.val_.adj(), 0.0);
 }
 
-TEST(ProbDistributionsOrdLog, fv_d) {
+TEST_F(AgradRev, ProbDistributionsOrdLog_fv_d) {
   using stan::math::fvar;
   using stan::math::ordered_logistic_lpmf;
   using stan::math::var;
@@ -122,7 +123,7 @@ TEST(ProbDistributionsOrdLog, fv_d) {
   EXPECT_FLOAT_EQ(c_ffv[2].d_.val_.adj(), 0.0);
 }
 
-TEST(ProbDistributionsOrdLog, fv_fv_vec) {
+TEST_F(AgradRev, ProbDistributionsOrdLog_fv_fv_vec) {
   using stan::math::fvar;
   using stan::math::ordered_logistic_lpmf;
   using stan::math::var;
@@ -187,7 +188,7 @@ TEST(ProbDistributionsOrdLog, fv_fv_vec) {
   EXPECT_FLOAT_EQ(c_ffv[2].d_.val_.adj(), 0.557132795804491);
 }
 
-TEST(ProbDistributionsOrdLog, fv_d_vec) {
+TEST_F(AgradRev, ProbDistributionsOrdLog_fv_d_vec) {
   using stan::math::fvar;
   using stan::math::ordered_logistic_lpmf;
   using stan::math::var;
@@ -270,7 +271,7 @@ TEST(ProbDistributionsOrdLog, fv_d_vec) {
   EXPECT_FLOAT_EQ(c_ffv[2].d_.val_.adj(), 1.20737912023631);
 }
 
-TEST(ProbDistributionsOrdLog, fv_fv_stvec) {
+TEST_F(AgradRev, ProbDistributionsOrdLog_fv_fv_stvec) {
   using stan::math::fvar;
   using stan::math::ordered_logistic_lpmf;
   using stan::math::var;
@@ -398,7 +399,7 @@ TEST(ProbDistributionsOrdLog, fv_fv_stvec) {
   EXPECT_FLOAT_EQ(std_c_ffv[3][2].d_.val_.adj(), -0.497500020833125);
 }
 
-TEST(ProbDistributionsOrdLog, fv_d_stvec) {
+TEST_F(AgradRev, ProbDistributionsOrdLog_fv_d_stvec) {
   using stan::math::fvar;
   using stan::math::ordered_logistic_lpmf;
   using stan::math::var;
diff --git a/test/unit/math/mix/prob/poisson_log_glm_lpmf_test.cpp b/test/unit/math/mix/prob/poisson_log_glm_lpmf_test.cpp
index 081b5816344..87292183450 100644
--- a/test/unit/math/mix/prob/poisson_log_glm_lpmf_test.cpp
+++ b/test/unit/math/mix/prob/poisson_log_glm_lpmf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, poisson_log_glm_lpmf) {
+TEST_F(AgradRev, mathMixScalFun_poisson_log_glm_lpmf) {
   auto f = [](const auto y) {
     return [=](const auto& x, const auto& alpha, const auto& beta) {
       return stan::math::poisson_log_glm_lpmf(y, x, alpha, beta);
diff --git a/test/unit/math/mix/prob/std_normal_ccdf_log_test.cpp b/test/unit/math/mix/prob/std_normal_ccdf_log_test.cpp
index 7aed750e4c2..3c2b01d395a 100644
--- a/test/unit/math/mix/prob/std_normal_ccdf_log_test.cpp
+++ b/test/unit/math/mix/prob/std_normal_ccdf_log_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, std_normal_lccdf) {
+TEST_F(AgradRev, mathMixScalFun_std_normal_lccdf) {
   auto f = [](const auto& y) { return stan::math::std_normal_lccdf(y); };
 
   stan::test::expect_ad(f, -50.0);
diff --git a/test/unit/math/mix/prob/std_normal_cdf_log_test.cpp b/test/unit/math/mix/prob/std_normal_cdf_log_test.cpp
index 3bc6ee837f6..7f566f3452f 100644
--- a/test/unit/math/mix/prob/std_normal_cdf_log_test.cpp
+++ b/test/unit/math/mix/prob/std_normal_cdf_log_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, std_normal_lcdf) {
+TEST_F(AgradRev, mathMixScalFun_std_normal_lcdf) {
   auto f = [](const auto& y) { return stan::math::std_normal_lcdf(y); };
 
   stan::test::expect_ad(f, -50.0);
diff --git a/test/unit/math/mix/prob/std_normal_cdf_test.cpp b/test/unit/math/mix/prob/std_normal_cdf_test.cpp
index 008203b6b7d..f19e47d5d81 100644
--- a/test/unit/math/mix/prob/std_normal_cdf_test.cpp
+++ b/test/unit/math/mix/prob/std_normal_cdf_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, std_normal_cdf) {
+TEST_F(AgradRev, mathMixScalFun_std_normal_cdf) {
   auto f = [](const auto& y) { return stan::math::std_normal_cdf(y); };
 
   stan::test::expect_ad(f, -50.0);
diff --git a/test/unit/math/mix/prob/std_normal_log_qf_test.cpp b/test/unit/math/mix/prob/std_normal_log_qf_test.cpp
index d71498a2a4e..1ae44dd9c27 100644
--- a/test/unit/math/mix/prob/std_normal_log_qf_test.cpp
+++ b/test/unit/math/mix/prob/std_normal_log_qf_test.cpp
@@ -4,7 +4,7 @@
 #include <test/unit/math/test_ad.hpp>
 #include <stan/math/fwd/prob/std_normal_log_qf.hpp>
 
-TEST(mathMixLogFun, stdNormalLogQf) {
+TEST_F(AgradRev, mathMixLogFun_stdNormalLogQf) {
   auto f = [](const auto& x1) { return stan::math::std_normal_log_qf(x1); };
   stan::test::expect_ad(f, -100.25);
   stan::test::expect_unary_vectorized(
@@ -14,7 +14,7 @@ TEST(mathMixLogFun, stdNormalLogQf) {
   stan::test::expect_unary_vectorized(f, log(0.02425), log(0.97575));
 }
 
-TEST(mathMixScalLogFun, stdNormalLogQfInt) {
+TEST_F(AgradRev, mathMixScalLogFun_stdNormalLogQfInt) {
   auto f = [](const auto& x1) { return stan::math::std_normal_log_qf(x1); };
   int y = 1;
   stan::test::expect_ad(f, y);
@@ -22,7 +22,7 @@ TEST(mathMixScalLogFun, stdNormalLogQfInt) {
   stan::test::expect_ad(f, y);
 }
 
-TEST(mathMixZeroLogFun, stdNormalLogQfZero) {
+TEST_F(AgradRev, mathMixZeroLogFun_stdNormalLogQfZero) {
   auto f = [](const auto& x1) { return stan::math::std_normal_log_qf(x1); };
   int y_int = 0;
   stan::test::expect_ad(f, y_int);
@@ -31,7 +31,7 @@ TEST(mathMixZeroLogFun, stdNormalLogQfZero) {
   stan::test::expect_ad(f, y);
 }
 
-TEST(mathMixMatFunLog, stdNormalLogQfVarmat) {
+TEST_F(AgradRev, mathMixMatFunLog_stdNormalLogQfVarmat) {
   using stan::math::vec_concat;
   using stan::test::expect_ad_vector_matvar;
   using stan::test::internal::common_args;
diff --git a/test/unit/math/mix/prob/std_normal_test.cpp b/test/unit/math/mix/prob/std_normal_test.cpp
index 5638d9d7481..22a3483409a 100644
--- a/test/unit/math/mix/prob/std_normal_test.cpp
+++ b/test/unit/math/mix/prob/std_normal_test.cpp
@@ -1,7 +1,7 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
 
-TEST(mathMixScalFun, std_normal) {
+TEST_F(AgradRev, mathMixScalFun_std_normal) {
   auto f = [](const auto& y) { return stan::math::std_normal_lpdf(y); };
 
   stan::test::expect_ad(f, -0.3);
diff --git a/test/unit/math/mix/prob/von_mises_cdf_test.cpp b/test/unit/math/mix/prob/von_mises_cdf_test.cpp
index 3443bbfc202..2f5630e3341 100644
--- a/test/unit/math/mix/prob/von_mises_cdf_test.cpp
+++ b/test/unit/math/mix/prob/von_mises_cdf_test.cpp
@@ -1,7 +1,7 @@
 #include <test/unit/math/test_ad.hpp>
 #include <limits>
 
-TEST(mathMixScalFun, von_mises_cdf) {
+TEST_F(AgradRev, mathMixScalFun_von_mises_cdf) {
   auto f = [](const auto& x, const auto& mu, const auto& k) {
     return stan::math::von_mises_cdf(x, mu, k);
   };
diff --git a/test/unit/math/mix/prob/von_mises_test.cpp b/test/unit/math/mix/prob/von_mises_test.cpp
index 6d959523201..4035b80ca79 100644
--- a/test/unit/math/mix/prob/von_mises_test.cpp
+++ b/test/unit/math/mix/prob/von_mises_test.cpp
@@ -1,7 +1,10 @@
 #include <stan/math/mix.hpp>
 #include <test/unit/math/test_ad.hpp>
+#include <test/unit/math/rev/fun/util.hpp>
+#include <gtest/gtest.h>
+#include <vector>
 
-TEST(mathMixScalFun, von_mises_lpdf) {
+TEST_F(AgradRev, mathMixScalFun_von_mises_lpdf) {
   auto f = [](const auto& y, const auto& mu, const auto& kappa) {
     return stan::math::von_mises_lpdf(y, mu, kappa);
   };
diff --git a/test/unit/math/mix/prob/wishart_cholesky_test.cpp b/test/unit/math/mix/prob/wishart_cholesky_test.cpp
index abefb023b62..6bea6752b50 100644
--- a/test/unit/math/mix/prob/wishart_cholesky_test.cpp
+++ b/test/unit/math/mix/prob/wishart_cholesky_test.cpp
@@ -1,6 +1,7 @@
 #include <test/unit/math/test_ad.hpp>
+#include <test/unit/math/rev/fun/util.hpp>
 
-TEST(ProbDistributionsWishartCholesky, matvar) {
+TEST_F(AgradRev, ProbDistributionsWishartCholesky_matvar) {
   auto f = [](const auto& Y, const auto& dof, const auto& Sigma) {
     auto symmetric_Y = ((Y + Y.transpose()) * 0.5).eval();
     auto symmetric_Sigma = ((Sigma + Sigma.transpose()) * 0.5).eval();
@@ -38,7 +39,7 @@ TEST(ProbDistributionsWishartCholesky, matvar) {
   stan::test::expect_ad_matvar(f, Y11, dof, Sigma00);
 }
 
-TEST(ProbDistributionsWishartCholesky, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsWishartCholesky_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -71,7 +72,7 @@ TEST(ProbDistributionsWishartCholesky, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsWishartCholesky, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsWishartCholesky_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/mix/prob/wishart_test.cpp b/test/unit/math/mix/prob/wishart_test.cpp
index 9dbc107c8c7..1683d786a53 100644
--- a/test/unit/math/mix/prob/wishart_test.cpp
+++ b/test/unit/math/mix/prob/wishart_test.cpp
@@ -1,6 +1,6 @@
 #include <test/unit/math/test_ad.hpp>
 
-TEST(ProbDistributionsWishart, matvar) {
+TEST_F(AgradRev, ProbDistributionsWishart_matvar) {
   auto f = [](const auto& y, const auto& dof, const auto& sigma) {
     auto y_sym = stan::math::multiply(0.5, y + y.transpose());
     auto sigma_sym = stan::math::multiply(0.5, sigma + sigma.transpose());
@@ -34,7 +34,7 @@ TEST(ProbDistributionsWishart, matvar) {
   stan::test::expect_ad_matvar(f, y11, dof, Sigma00);
 }
 
-TEST(ProbDistributionsWishart, fvar_var) {
+TEST_F(AgradRev, ProbDistributionsWishart_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
@@ -61,7 +61,7 @@ TEST(ProbDistributionsWishart, fvar_var) {
   stan::math::recover_memory();
 }
 
-TEST(ProbDistributionsWishart, fvar_fvar_var) {
+TEST_F(AgradRev, ProbDistributionsWishart_fvar_fvar_var) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fvar;
diff --git a/test/unit/math/rev/core/arena_matrix_test.cpp b/test/unit/math/rev/core/arena_matrix_test.cpp
index cb339ae73bd..f67650c1a84 100644
--- a/test/unit/math/rev/core/arena_matrix_test.cpp
+++ b/test/unit/math/rev/core/arena_matrix_test.cpp
@@ -21,6 +21,7 @@ TEST_F(AgradRev, arena_matrix_matrix_test) {
   a = c;
   a2 = std::move(d);
   a3 = 2 * a;
+
   b = d;
   b2 = std::move(c);
   e = e + a;
@@ -239,3 +240,13 @@ TEST_F(AgradRev, arena_sparse_matrix_inplace_ops) {
   }
   expect_sparse_dense_matrix_equal(A_m, C);
 }
+
+// A moved-in vector keeps its values and adds one var_alloc_stack_ entry.
+TEST_F(AgradRev, arena_matrix_move_test) {
+  using stan::math::arena_matrix;
+  Eigen::VectorXd c = Eigen::VectorXd::Random(3);
+  Eigen::VectorXd d = c;  // reference copy taken before c is moved from
+  arena_matrix<Eigen::VectorXd> a(std::move(c));
+  EXPECT_MATRIX_EQ(a, d);
+  EXPECT_EQ(stan::math::ChainableStack::instance_->var_alloc_stack_.size(), 1);
+}
diff --git a/test/unit/math/rev/fun/fill_test.cpp b/test/unit/math/rev/fun/fill_test.cpp
index 5a3fb8476b0..7dae163c0f7 100644
--- a/test/unit/math/rev/fun/fill_test.cpp
+++ b/test/unit/math/rev/fun/fill_test.cpp
@@ -1,9 +1,10 @@
 #include <stan/math/rev.hpp>
-#include <gtest/gtest.h>
 #include <test/unit/math/rev/fun/util.hpp>
+#include <test/unit/math/rev/util.hpp>
+#include <gtest/gtest.h>
 #include <vector>
 
-TEST(AgradRevMatrix, fill) {
+TEST_F(AgradRev, fill) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fill;
@@ -43,7 +44,7 @@ TEST(AgradRevMatrix, fill) {
     for (size_t j = 0; j < 2; ++j)
       EXPECT_FLOAT_EQ(54, d[i][j].val());
 }
-TEST(AgradRevMatrix, fillDouble) {
+TEST_F(AgradRev, fillDouble) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fill;
@@ -53,13 +54,14 @@ TEST(AgradRevMatrix, fillDouble) {
   EXPECT_FLOAT_EQ(3.0, y[0]);
 }
 
-TEST(AgradRevMatrix, fillVarMatDouble) {
+TEST_F(AgradRev, fillVarMatDouble) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fill;
   using stan::math::sum;
   using stan::math::var_value;
-  Matrix<double, Dynamic, 1> y_val(3);
+  Matrix<double, Dynamic, 1> y_val
+      = Matrix<double, Dynamic, 1>::Constant(3, 2.0);
   var_value<Matrix<double, Dynamic, 1>> y(y_val);
   fill(y, 3.0);
   EXPECT_EQ(3, y.size());
@@ -71,14 +73,15 @@ TEST(AgradRevMatrix, fillVarMatDouble) {
   }
 }
 
-TEST(AgradRevMatrix, fillVarMatVar) {
+TEST_F(AgradRev, fillVarMatVar) {
   using Eigen::Dynamic;
   using Eigen::Matrix;
   using stan::math::fill;
   using stan::math::sum;
   using stan::math::var;
   using stan::math::var_value;
-  Matrix<double, Dynamic, 1> y_val(3);
+  Matrix<double, Dynamic, 1> y_val
+      = Matrix<double, Dynamic, 1>::Constant(3, 2.0);
   var_value<Matrix<double, Dynamic, 1>> y(y_val);
   var z(3.0);
   fill(y, z);
diff --git a/test/unit/math/rev/fun/to_soa_sparse_matrix_test.cpp b/test/unit/math/rev/fun/to_soa_sparse_matrix_test.cpp
new file mode 100644
index 00000000000..fbc495ac432
--- /dev/null
+++ b/test/unit/math/rev/fun/to_soa_sparse_matrix_test.cpp
@@ -0,0 +1,75 @@
+#include <iostream>
+#include <stan/math/prim/fun/Eigen.hpp>
+#include <stan/math/rev/fun/to_soa_sparse_matrix.hpp>
+#include <stan/math/rev/core.hpp>
+#include <test/unit/math/rev/util.hpp>
+#include <vector>
+
+// Dense double inputs must appear unchanged as the sparse result's values.
+TEST_F(AgradRev, to_soa_sparse_matrix_matrix_double) {
+  using stan::math::to_soa_sparse_matrix;
+  using stan::math::var_value;
+  std::vector<int> v{0, 1, 2, 0, 1};
+  std::vector<int> u{0, 1, 2, 3, 4, 5};
+  int m = 5;
+  int n = 5;
+  Eigen::VectorXd w(5);
+  w << 1, 2, 3, 4, 5;
+  var_value<Eigen::SparseMatrix<double, Eigen::RowMajor>> w_mat_arena
+      = to_soa_sparse_matrix<Eigen::RowMajor>(m, n, w, u, v);
+  for (int i = 0; i < w.size(); ++i) {
+    EXPECT_EQ(w_mat_arena.val().valuePtr()[i], w(i));
+  }
+}
+
+TEST_F(AgradRev, to_soa_sparse_matrix_matrix_var) {
+  using stan::math::to_soa_sparse_matrix;
+  using stan::math::var;
+  using stan::math::var_value;
+  std::vector<int> v{0, 1, 2, 0, 1};
+  std::vector<int> u{0, 1, 2, 3, 4, 5};
+  int m = 5;
+  int n = 5;
+  Eigen::VectorXd w(5);
+  w << 1, 2, 3, 4, 5;
+  Eigen::Matrix<var, -1, 1> w_var(w);  // var vector built from the doubles
+  var_value<Eigen::SparseMatrix<double, Eigen::RowMajor>> w_mat_arena
+      = to_soa_sparse_matrix<Eigen::RowMajor>(m, n, w_var, u, v);
+  for (int i = 0; i < w.size(); ++i) {
+    EXPECT_EQ(w_mat_arena.val().valuePtr()[i], w(i));  // compare to inputs
+  }
+}
+
+// Checks values match and adjoint writes on either side reach the other.
+TEST_F(AgradRev, to_soa_sparse_matrix_var_matrix) {
+  using stan::math::to_soa_sparse_matrix;
+  using stan::math::var_value;
+  std::vector<int> v{0, 1, 2, 0, 1};
+  std::vector<int> u{0, 1, 2, 3, 4, 5};
+  int m = 5;
+  int n = 5;
+  Eigen::VectorXd w(5);
+  w << 1, 2, 3, 4, 5;
+  var_value<Eigen::VectorXd> w_var(w);
+  var_value<Eigen::SparseMatrix<double, Eigen::RowMajor>> w_mat_arena
+      = to_soa_sparse_matrix<Eigen::RowMajor>(m, n, w_var, u, v);
+  for (int i = 0; i < w.size(); ++i) {
+    EXPECT_EQ(w_mat_arena.val().valuePtr()[i], w(i));
+  }
+  // Write through the sparse adjoints first, then (below) through w_var
+  for (int i = 0; i < w.size(); ++i) {
+    w_mat_arena.adj().valuePtr()[i] = i;
+  }
+  for (int i = 0; i < w.size(); ++i) {
+    EXPECT_EQ(w_mat_arena.adj().valuePtr()[i], w_var.adj()(i));
+  }
+  for (int i = 0; i < w.size(); ++i) {
+    w_mat_arena.adj().valuePtr()[i] = 0;
+  }
+  for (int i = 0; i < w.size(); ++i) {
+    w_var.adj().coeffRef(i) = i;
+  }
+  for (int i = 0; i < w.size(); ++i) {
+    EXPECT_EQ(w_mat_arena.adj().valuePtr()[i], w_var.adj()(i));
+  }
+}
diff --git a/test/unit/math/rev/util.hpp b/test/unit/math/rev/util.hpp
index 87db3580415..3725aa1da0b 100644
--- a/test/unit/math/rev/util.hpp
+++ b/test/unit/math/rev/util.hpp
@@ -10,6 +10,10 @@ struct AgradRev : public testing::Test {
     // make sure memory's clean before starting each test
     stan::math::recover_memory();
   }
+  void TearDown() {
+    // recover memory after each test as well, so no test leaves any behind
+    stan::math::recover_memory();
+  }
 };
 
 namespace stan {
diff --git a/test/unit/math/test_ad.hpp b/test/unit/math/test_ad.hpp
index 7d7547bdbd9..0cd8c9759e1 100644
--- a/test/unit/math/test_ad.hpp
+++ b/test/unit/math/test_ad.hpp
@@ -8,12 +8,13 @@
 #include <test/unit/math/expect_near_rel.hpp>
 #include <test/unit/math/test_ad_matvar.hpp>
 #include <test/unit/util.hpp>
+#include <test/unit/math/rev/util.hpp>
 #include <gtest/gtest.h>
 #include <algorithm>
 #include <cmath>
 #include <string>
 #include <vector>
-
+#include <test/unit/math/test_ad.hpp>
 using d_t = double;
 using v_t = stan::math::var;
 using fd_t = stan::math::fvar<d_t>;