Merge pull request #3211 from stan-dev/student-t-qf

SteveBronder · web-flow · commit a37a37cde090 · 2026-05-05T15:42:04.000-04:00
Add quantile function for Student-T distribution
diff --git a/stan/math/fwd/prob.hpp b/stan/math/fwd/prob.hpp
@@ -5,5 +5,6 @@
 #include <stan/math/fwd/fun/Eigen_NumTraits.hpp>
 
 #include <stan/math/fwd/prob/std_normal_log_qf.hpp>
+#include <stan/math/fwd/prob/student_t_qf.hpp>
 
 #endif
diff --git a/stan/math/fwd/prob/student_t_qf.hpp b/stan/math/fwd/prob/student_t_qf.hpp
@@ -0,0 +1,94 @@
+#ifndef STAN_MATH_FWD_PROB_STUDENT_T_QF_HPP
+#define STAN_MATH_FWD_PROB_STUDENT_T_QF_HPP
+
+#include <stan/math/fwd/meta.hpp>
+#include <stan/math/fwd/fun/digamma.hpp>
+#include <stan/math/fwd/fun/exp.hpp>
+#include <stan/math/fwd/fun/hypergeometric_2F1.hpp>
+#include <stan/math/fwd/fun/hypergeometric_pFq.hpp>
+#include <stan/math/fwd/fun/inv_inc_beta.hpp>
+#include <stan/math/fwd/fun/log.hpp>
+#include <stan/math/fwd/fun/sqrt.hpp>
+#include <stan/math/fwd/fun/value_of.hpp>
+#include <stan/math/fwd/fun/value_of_rec.hpp>
+#include <stan/math/prim/meta.hpp>
+#include <stan/math/prim/prob/student_t_lpdf.hpp>
+
+namespace stan {
+namespace math {
+
+/**
+ * Forward-mode overload of the Student's t quantile function for scalar
+ * arguments, at least one of which is an `fvar`.
+ *
+ * The value is `mu + s * sigma * sqrt(nu) * sqrt(1 / x - 1)` where
+ * `x = inv_inc_beta(nu / 2, 1 / 2, 2 * min(p, 1 - p))` and `s` is -1 for
+ * `p < 0.5` and +1 otherwise. The tangent is the sum of one term per
+ * autodiff argument.
+ *
+ * Special cases:
+ * - `p == 0` returns negative infinity and `p == 1` returns positive
+ *   infinity, both with a zero tangent.
+ * - `p == 0.5` returns `mu`. The quantile there does not depend on `nu` or
+ *   `sigma`, so only the `mu` tangent and the `p` tangent (scaled by the
+ *   reciprocal density at `mu`) are propagated.
+ *
+ * @tparam T_p type of the probability parameter
+ * @tparam T_nu type of the degrees of freedom parameter
+ * @tparam T_mu type of the location parameter
+ * @tparam T_sigma type of the scale parameter
+ * @param p Probability in the range [0, 1].
+ * @param nu Degrees of freedom, checked to be non-negative.
+ * @param mu Location parameter.
+ * @param sigma Scale parameter, checked to be positive.
+ * @return Quantile value with its forward-mode tangent.
+ */
+template <typename T_p, typename T_nu, typename T_mu, typename T_sigma,
+          require_all_stan_scalar_t<T_p, T_mu, T_sigma, T_nu>* = nullptr,
+          require_any_fvar_t<T_p, T_nu, T_mu, T_sigma>* = nullptr>
+inline auto student_t_qf(const T_p& p, const T_nu& nu, const T_mu& mu,
+                         const T_sigma& sigma) {
+  static constexpr const char* function = "student_t_qf";
+  using FvarT = return_type_t<T_p, T_mu, T_sigma, T_nu>;
+  using T_partials = partials_type_t<FvarT>;
+
+  auto p_val = value_of(p);
+  auto nu_val = value_of(nu);
+  auto mu_val = value_of(mu);
+  auto sigma_val = value_of(sigma);
+
+  check_nonnegative(function, "Degrees of freedom parameter", nu_val);
+  check_positive(function, "Scale parameter", sigma_val);
+  check_bounded(function, "Probability parameter", p_val, 0.0, 1.0);
+
+  if (unlikely(p_val == 0.0)) {
+    return FvarT{NEGATIVE_INFTY, 0.0};
+  } else if (unlikely(p_val == 1.0)) {
+    return FvarT{INFTY, 0.0};
+  } else if (unlikely(p_val == 0.5)) {
+    // The general formulas below divide by sqrt(1 / x - 1), which is zero at
+    // the median, so the median is handled here. The sigma and nu partials
+    // vanish (the standardized quantile is 0 for every nu), but the mu and p
+    // partials do not and must still be propagated.
+    FvarT median(mu_val, 0.0);
+    if constexpr (is_autodiff_v<T_mu>) {
+      median.d_ += mu.d_;
+    }
+    if constexpr (is_autodiff_v<T_p>) {
+      median.d_
+          += p.d_ * exp(-student_t_lpdf(mu_val, nu_val, mu_val, sigma_val));
+    }
+    return median;
+  }
+
+  // Work in the lower tail and restore the sign afterwards.
+  const auto p_val_flip = p_val < 0.5 ? p_val : 1.0 - p_val;
+  const double p_sign = value_of_rec(p_val) < 0.5 ? -1.0 : 1.0;
+  auto sqrt_nu_val = sqrt(nu_val);
+  auto ibeta_arg = inv_inc_beta(0.5 * nu_val, 0.5, 2.0 * p_val_flip);
+  auto rtn_val
+      = mu_val
+        + p_sign * sigma_val * sqrt_nu_val * sqrt(-1.0 + 1.0 / ibeta_arg);
+
+  FvarT rtn(rtn_val, 0.0);
+
+  if constexpr (is_autodiff_v<T_p>) {
+    // dQ/dp is the reciprocal of the density evaluated at the quantile.
+    rtn.d_ += p.d_ * exp(-student_t_lpdf(rtn_val, nu_val, mu_val, sigma_val));
+  }
+
+  if constexpr (is_autodiff_v<T_nu>) {
+    const auto half_nu = nu_val / 2.0;
+    Eigen::Matrix<T_partials, -1, 1> hyper_arg_a{{0.5, half_nu, half_nu}};
+    Eigen::Matrix<T_partials, -1, 1> hyper_arg_b{
+        {1.0 + half_nu, 1.0 + half_nu}};
+    const auto hyper_arg
+        = hypergeometric_pFq(hyper_arg_a, hyper_arg_b, ibeta_arg);
+    const auto hyper2f1 = hypergeometric_2F1(1.0, (1.0 + nu_val) / 2.0,
+                                             (2.0 + nu_val) / 2.0, ibeta_arg);
+    const auto digamma_a1 = digamma(half_nu);
+    const auto digamma_a2 = digamma((1.0 + nu_val) / 2.0);
+
+    const auto arg_1 = (4.0 * hyper_arg * sqrt(1.0 - ibeta_arg)) / nu_val;
+    const auto arg_2 = -2.0 * hyper2f1 * (-1.0 + ibeta_arg)
+                       * (log(ibeta_arg) - digamma_a1 + digamma_a2);
+
+    const auto num1 = sigma_val * (-2.0 + (2.0 - arg_1 + arg_2) / ibeta_arg);
+    const auto den1 = 4.0 * sqrt_nu_val * sqrt(-1.0 + 1.0 / ibeta_arg);
+    rtn.d_ += nu.d_ * p_sign * num1 / den1;
+  }
+
+  if constexpr (is_autodiff_v<T_mu>) {
+    // The quantile is a pure shift in mu.
+    rtn.d_ += mu.d_;
+  }
+
+  if constexpr (is_autodiff_v<T_sigma>) {
+    // dQ/dsigma is the standardized quantile (Q - mu) / sigma.
+    rtn.d_ += sigma.d_ * p_sign * sqrt_nu_val * sqrt(-1.0 + 1.0 / ibeta_arg);
+  }
+
+  return rtn;
+}
+}  // namespace math
+}  // namespace stan
+
+#endif
diff --git a/stan/math/prim/fun/hypergeometric_pFq.hpp b/stan/math/prim/fun/hypergeometric_pFq.hpp
@@ -4,6 +4,7 @@
 #include <stan/math/prim/meta.hpp>
 #include <stan/math/prim/err/check_not_nan.hpp>
 #include <stan/math/prim/err/check_finite.hpp>
+#include <stan/math/prim/fun/to_ref.hpp>
 #include <stan/math/prim/fun/to_row_vector.hpp>
 #include <boost/math/special_functions/hypergeometric_pFq.hpp>
 
@@ -25,34 +26,53 @@ namespace math {
 template <typename Ta, typename Tb, typename Tz,
           require_all_vector_st<std::is_arithmetic, Ta, Tb>* = nullptr,
           require_arithmetic_t<Tz>* = nullptr>
-inline return_type_t<Ta, Tb, Tz> hypergeometric_pFq(const Ta& a, const Tb& b,
-                                                    const Tz& z) {
-  plain_type_t<Ta> a_ref = a;
-  plain_type_t<Tb> b_ref = b;
+inline return_type_t<Ta, Tb, Tz> hypergeometric_pFq(Ta&& a, Tb&& b, Tz&& z) {
+  decltype(auto) a_ref = to_ref(std::forward<Ta>(a));
+  decltype(auto) b_ref = to_ref(std::forward<Tb>(b));
   check_finite("hypergeometric_pFq", "a", a_ref);
   check_finite("hypergeometric_pFq", "b", b_ref);
   check_finite("hypergeometric_pFq", "z", z);
-
   check_not_nan("hypergeometric_pFq", "a", a_ref);
   check_not_nan("hypergeometric_pFq", "b", b_ref);
   check_not_nan("hypergeometric_pFq", "z", z);
 
-  bool condition_1 = (a_ref.size() > (b_ref.size() + 1)) && (z != 0);
-  bool condition_2 = (a_ref.size() == (b_ref.size() + 1)) && (std::fabs(z) > 1);
+  // Argument combinations rejected below as non-convergent: more than
+  // size(b) + 1 entries in `a` with a nonzero `z`, or exactly size(b) + 1
+  // entries in `a` with |z| > 1.
+  const bool condition_1 = (a_ref.size() > (b_ref.size() + 1)) && (z != 0);
+  const bool condition_2
+      = (a_ref.size() == (b_ref.size() + 1)) && (std::fabs(z) > 1);
 
   if (condition_1 || condition_2) {
-    std::stringstream msg;
-    msg << "hypergeometric function pFq does not meet convergence "
-        << "conditions with given arguments. "
-        << "a: " << to_row_vector(a_ref) << ", "
-        << "b: " << to_row_vector(b_ref) << ", "
-        << "z: " << z;
-    throw std::domain_error(msg.str());
+    [&]() STAN_COLD_PATH {
+      std::stringstream msg;
+      msg << "hypergeometric function pFq does not meet convergence "
+             "conditions with given arguments. "
+             "a: "
+          << to_row_vector(a_ref) << ", "
+          << "b: " << to_row_vector(b_ref) << ", "
+          << "z: " << z;
+      throw std::domain_error(msg.str());
+    }();
+  }
+  // When both arguments are already plain vectors, their storage can be
+  // handed to boost through an Eigen::Map instead of being copied.
+  using a_ref_t = decltype(a_ref);
+  using b_ref_t = decltype(b_ref);
+  constexpr bool is_a_plain_vec
+      = std::is_same_v<std::decay_t<a_ref_t>, plain_type_t<a_ref_t>>;
+  constexpr bool is_b_plain_vec
+      = std::is_same_v<std::decay_t<b_ref_t>, plain_type_t<b_ref_t>>;
+  if constexpr (is_a_plain_vec && is_b_plain_vec) {
+    // Wrap the existing storage in an Eigen::Map view so that no copy of the
+    // data is made. NOTE(review): the const_cast is only there because map_t
+    // is a mutable Map; presumably boost only reads the values - confirm.
+    using map_t = Eigen::Map<Eigen::VectorXd>;
+    auto map_a = map_t(const_cast<double*>(a_ref.data()), a_ref.size());
+    auto map_b = map_t(const_cast<double*>(b_ref.data()), b_ref.size());
+    return boost::math::hypergeometric_pFq(map_a, map_b, z);
+  } else {
+    // Otherwise evaluate `a` and `b` first so that contiguous data pointers
+    // exist, then copy the values into std::vector for boost.
+    decltype(auto) a_eval = eval(a_ref);
+    decltype(auto) b_eval = eval(b_ref);
+    return boost::math::hypergeometric_pFq(
+        std::vector<double>(a_eval.data(), a_eval.data() + a_eval.size()),
+        std::vector<double>(b_eval.data(), b_eval.data() + b_eval.size()), z);
   }
-
-  return boost::math::hypergeometric_pFq(
-      std::vector<double>(a_ref.data(), a_ref.data() + a_ref.size()),
-      std::vector<double>(b_ref.data(), b_ref.data() + b_ref.size()), z);
 }
 }  // namespace math
 }  // namespace stan
diff --git a/stan/math/prim/meta.hpp b/stan/math/prim/meta.hpp
@@ -71,6 +71,7 @@
 #include <stan/math/prim/meta/ad_promotable.hpp>
 #include <stan/math/prim/meta/append_return_type.hpp>
 #include <stan/math/prim/meta/base_type.hpp>
+#include <stan/math/prim/meta/common_container_type.hpp>
 #include <stan/math/prim/meta/contains_std_vector.hpp>
 #include <stan/math/prim/meta/contains_tuple.hpp>
 #include <stan/math/prim/meta/error_index.hpp>
diff --git a/stan/math/prim/meta/common_container_type.hpp b/stan/math/prim/meta/common_container_type.hpp
@@ -0,0 +1,77 @@
+#ifndef STAN_MATH_PRIM_META_COMMON_CONTAINER_TYPE_HPP
+#define STAN_MATH_PRIM_META_COMMON_CONTAINER_TYPE_HPP
+
+#include <stan/math/prim/meta/is_container.hpp>
+#include <stan/math/prim/meta/is_tuple.hpp>
+#include <stan/math/prim/meta/is_detected.hpp>
+#include <stan/math/prim/meta/is_stan_scalar.hpp>
+#include <stan/math/prim/meta/is_var_matrix.hpp>
+#include <stan/math/prim/meta/plain_type.hpp>
+#include <stan/math/prim/meta/return_type.hpp>
+#include <stan/math/prim/meta/promote_scalar_type.hpp>
+#include <type_traits>
+
+namespace stan {
+namespace internal {
+/**
+ * Pairwise building block for `common_container_type`.
+ *
+ * The primary template is only declared; one of the partial specializations
+ * below is selected through the two trailing `void` parameters, which are
+ * filled by `require_*_t` constraints on `T1` and `T2`.
+ * NOTE(review): this relies on the `require_*_t` aliases resolving to `void`
+ * when satisfied - confirm against their definitions.
+ *
+ * @tparam T1 first type (scalar or container)
+ * @tparam T2 second type (scalar or container)
+ */
+template <typename T1, typename T2, typename = void, typename = void>
+struct common_container_type_impl;
+
+/**
+ * Scalar with scalar: `type` is the common return scalar of the two.
+ */
+template <typename T1, typename T2>
+struct common_container_type_impl<T1, T2, require_stan_scalar_t<T1>,
+                                  require_stan_scalar_t<T2>> {
+  using type = return_type_t<T1, T2>;
+};
+
+/**
+ * Container with container: both plain container types are promoted to the
+ * common return scalar. `type` is that promoted container when the two
+ * promoted types are identical, and `void` otherwise.
+ */
+template <typename T1, typename T2>
+struct common_container_type_impl<T1, T2, require_container_t<T1>,
+                                  require_container_t<T2>> {
+  using return_t = return_type_t<T1, T2>;
+  using container_type_1 = math::promote_scalar_t<return_t, plain_type_t<T1>>;
+  using container_type_2 = math::promote_scalar_t<return_t, plain_type_t<T2>>;
+  using type = std::conditional_t<
+      std::is_same<container_type_1, container_type_2>::value, container_type_1,
+      void>;
+};
+
+/**
+ * Scalar with container: `type` is the plain type of the container `T2`
+ * promoted to the common return scalar.
+ */
+template <typename T1, typename T2>
+struct common_container_type_impl<T1, T2, require_stan_scalar_t<T1>,
+                                  require_container_t<T2>> {
+  using type = math::promote_scalar_t<return_type_t<T1, T2>, plain_type_t<T2>>;
+};
+
+/**
+ * Container with scalar: `type` is the plain type of the container `T1`
+ * promoted to the common return scalar.
+ */
+template <typename T1, typename T2>
+struct common_container_type_impl<T1, T2, require_container_t<T1>,
+                                  require_stan_scalar_t<T2>> {
+  using type = math::promote_scalar_t<return_type_t<T1, T2>, plain_type_t<T1>>;
+};
+}  // namespace internal
+
+/**
+ * Primary template; only the specializations below are defined, so at least
+ * one type argument is required.
+ */
+template <typename... Ts>
+struct common_container_type;
+
+/**
+ * Base case of the recursion: a single type is combined with `double`.
+ */
+template <typename T>
+struct common_container_type<T> {
+  using type = typename internal::common_container_type_impl<
+      T, double>::type;  // Use double for base case
+};
+
+/**
+ * Determine the common container type for a variadic list of types.
+ * If all types are scalars, the common scalar type is returned.
+ * If all container types are the same, but not necessarily with the same
+ * scalar type, that container type with the common scalar type is returned.
+ *
+ * If different container types are present, the pairwise step yields `void`.
+ * NOTE(review): when that `void` comes from the tail `Ts...` it is fed back
+ * into `common_container_type_impl`, which has no visible specialization for
+ * `void` - confirm how mismatches in the tail are meant to surface.
+ *
+ * The list is reduced from the right: the result for `Ts...` is computed
+ * first and then combined with `T1`.
+ */
+template <typename T1, typename... Ts>
+struct common_container_type<T1, Ts...> {
+  using type = typename internal::common_container_type_impl<
+      T1, typename common_container_type<Ts...>::type>::type;
+};
+
+/** Convenience alias for `common_container_type<Ts...>::type`. */
+template <typename... Ts>
+using common_container_t = typename common_container_type<Ts...>::type;
+
+}  // namespace stan
+
+#endif  // STAN_MATH_PRIM_META_COMMON_CONTAINER_TYPE_HPP
diff --git a/stan/math/prim/prob.hpp b/stan/math/prim/prob.hpp
@@ -287,6 +287,7 @@
 #include <stan/math/prim/prob/student_t_lccdf.hpp>
 #include <stan/math/prim/prob/student_t_lcdf.hpp>
 #include <stan/math/prim/prob/student_t_lpdf.hpp>
+#include <stan/math/prim/prob/student_t_qf.hpp>
 #include <stan/math/prim/prob/student_t_rng.hpp>
 #include <stan/math/prim/prob/uniform_ccdf_log.hpp>
 #include <stan/math/prim/prob/uniform_cdf.hpp>
diff --git a/stan/math/prim/prob/student_t_qf.hpp b/stan/math/prim/prob/student_t_qf.hpp
@@ -0,0 +1,98 @@
+#ifndef STAN_MATH_PRIM_PROB_STUDENT_T_QF_HPP
+#define STAN_MATH_PRIM_PROB_STUDENT_T_QF_HPP
+
+#include <stan/math/prim/meta.hpp>
+#include <stan/math/prim/err.hpp>
+#include <stan/math/prim/fun/sqrt.hpp>
+#include <stan/math/prim/fun/inv_inc_beta.hpp>
+#include <stan/math/prim/fun/max_size.hpp>
+
+namespace stan {
+namespace math {
+
+/**
+ * Quantile function (inverse CDF) of the Student's t-distribution for
+ * arithmetic scalar arguments.
+ *
+ * The end points `p == 0` and `p == 1` map to negative and positive infinity
+ * and the median `p == 0.5` maps to `mu`. Every other probability is folded
+ * into the lower tail, inverted through the regularized incomplete beta
+ * function, and given its sign back.
+ *
+ * @tparam T_p type of the probability parameter
+ * @tparam T_nu type of the degrees of freedom parameter
+ * @tparam T_mu type of the location parameter
+ * @tparam T_sigma type of the scale parameter
+ * @param p Probability in the range [0, 1].
+ * @param nu Degrees of freedom, must be non-negative.
+ * @param mu Location parameter.
+ * @param sigma Scale parameter, must be positive.
+ * @return Quantile function value.
+ * @throw std::domain_error if `nu` is negative or `sigma` is not positive,
+ * or if `p` is not in [0, 1].
+ */
+template <typename T_p, typename T_nu, typename T_mu, typename T_sigma,
+          require_all_stan_scalar_t<T_p, T_nu, T_mu, T_sigma>* = nullptr,
+          require_all_arithmetic_t<T_p, T_nu, T_mu, T_sigma>* = nullptr>
+inline double student_t_qf(const T_p& p, const T_nu& nu, const T_mu& mu,
+                           const T_sigma& sigma) {
+  static constexpr const char* function = "student_t_qf";
+  check_nonnegative(function, "Degrees of freedom parameter", nu);
+  check_positive(function, "Scale parameter", sigma);
+  check_bounded(function, "Probability parameter", p, 0.0, 1.0);
+
+  // Closed-form answers at the end points and at the median.
+  if (p == 0.0) {
+    return NEGATIVE_INFTY;
+  }
+  if (p == 1.0) {
+    return INFTY;
+  }
+  if (p == 0.5) {
+    return mu;
+  }
+
+  // Fold the probability into the lower tail and remember which side it
+  // came from.
+  const bool in_lower_tail = p < 0.5;
+  const double tail_prob = in_lower_tail ? p : 1.0 - p;
+  const double direction = in_lower_tail ? -1.0 : 1.0;
+  const auto beta_quantile = inv_inc_beta(0.5 * nu, 0.5, 2 * tail_prob);
+
+  // Keep the left-to-right multiplication order of the closed-form
+  // expression.
+  const auto signed_scale = direction * sigma * sqrt(nu);
+  return mu + signed_scale * sqrt(-1.0 + 1.0 / beta_quantile);
+}
+
+/**
+ * A vectorized version of the Student's t quantile function, selected when
+ * at least one argument is a vector type. Scalar arguments are broadcast
+ * against the vector arguments.
+ *
+ * The result type is `common_container_t` of the argument types, sized to
+ * the largest argument.
+ *
+ * @tparam T_p type of the probability parameter
+ * @tparam T_nu type of the degrees of freedom parameter
+ * @tparam T_mu type of the location parameter
+ * @tparam T_sigma type of the scale parameter
+ * @param p Probability in the range [0, 1].
+ * @param nu Degrees of freedom, must be non-negative.
+ * @param mu Location parameter.
+ * @param sigma Scale parameter, must be positive.
+ * @return Container with quantile function values for each input.
+ * @throw std::invalid_argument if the container arguments have mismatched
+ * sizes.
+ */
+template <typename T_p, typename T_nu, typename T_mu, typename T_sigma,
+          require_any_vector_t<T_p, T_nu, T_mu, T_sigma>* = nullptr>
+inline auto student_t_qf(const T_p& p, const T_nu& nu, const T_mu& mu,
+                         const T_sigma& sigma) {
+  using T_container = common_container_t<T_p, T_nu, T_mu, T_sigma>;
+  static constexpr const char* function = "student_t_qf";
+  // Every element is read up to the largest size below, so containers of
+  // different lengths must be rejected before indexing.
+  check_consistent_sizes(function, "Probability parameter", p,
+                         "Degrees of freedom parameter", nu,
+                         "Location parameter", mu, "Scale parameter", sigma);
+  const size_t max_size_all = max_size(p, nu, mu, sigma);
+  T_container result(max_size_all);
+
+  ref_type_t<T_p> p_ref = p;
+  ref_type_t<T_nu> nu_ref = nu;
+  ref_type_t<T_mu> mu_ref = mu;
+  ref_type_t<T_sigma> sigma_ref = sigma;
+
+  scalar_seq_view<ref_type_t<T_p>> p_vec(p_ref);
+  scalar_seq_view<ref_type_t<T_nu>> nu_vec(nu_ref);
+  scalar_seq_view<ref_type_t<T_mu>> mu_vec(mu_ref);
+  scalar_seq_view<ref_type_t<T_sigma>> sigma_vec(sigma_ref);
+
+  // Element-wise evaluation through the scalar overload.
+  for (size_t i = 0; i < max_size_all; ++i) {
+    result[i] = student_t_qf(p_vec[i], nu_vec[i], mu_vec[i], sigma_vec[i]);
+  }
+
+  return result;
+}
+
+}  // namespace math
+}  // namespace stan
+
+#endif
diff --git a/stan/math/rev/fun/hypergeometric_pFq.hpp b/stan/math/rev/fun/hypergeometric_pFq.hpp
@@ -23,14 +23,16 @@ namespace math {
  * @return Generalized hypergeometric function
  */
 template <typename Ta, typename Tb, typename Tz,
-          bool grad_a = is_autodiff_v<Ta>, bool grad_b = is_autodiff_v<Tb>,
-          bool grad_z = is_autodiff_v<Tz>,
           require_all_vector_t<Ta, Tb>* = nullptr,
           require_return_type_t<is_var, Ta, Tb, Tz>* = nullptr>
 inline var hypergeometric_pFq(Ta&& a, Tb&& b, Tz&& z) {
-  auto&& arena_a = to_arena(as_column_vector_or_scalar(std::forward<Ta>(a)));
-  auto&& arena_b = to_arena(as_column_vector_or_scalar(std::forward<Tb>(b)));
-  auto pfq_val = hypergeometric_pFq(arena_a.val(), arena_b.val(), value_of(z));
+  constexpr bool grad_a = is_autodiff_v<Ta>;
+  constexpr bool grad_b = is_autodiff_v<Tb>;
+  constexpr bool grad_z = is_autodiff_v<Tz>;
+  auto arena_a = to_arena(as_column_vector_or_scalar(std::forward<Ta>(a)));
+  auto arena_b = to_arena(as_column_vector_or_scalar(std::forward<Tb>(b)));
+  auto pfq_val
+      = hypergeometric_pFq(value_of(arena_a), value_of(arena_b), value_of(z));
   return make_callback_var(
       pfq_val, [arena_a, arena_b, z, pfq_val](auto& vi) mutable {
         auto grad_tuple = grad_pFq<grad_a, grad_b, grad_z>(
diff --git a/stan/math/rev/prob.hpp b/stan/math/rev/prob.hpp
diff --git a/stan/math/rev/prob/student_t_qf.hpp b/stan/math/rev/prob/student_t_qf.hpp
diff --git a/test/unit/math/mix/prob/student_t_qf_test.cpp b/test/unit/math/mix/prob/student_t_qf_test.cpp
diff --git a/test/unit/math/prim/prob/student_t_qf_test.cpp b/test/unit/math/prim/prob/student_t_qf_test.cpp