tatooine/solve_8h_source.html

#ifndef TATOOINE_TENSOR_OPERATIONS_SOLVE_H

#define TATOOINE_TENSOR_OPERATIONS_SOLVE_H

//==============================================================================

#include <tatooine/tensor_concepts.h>

#include <tatooine/tensor_operations/determinant.h>

#include <tatooine/utility.h>


#include <cstdint>

//==============================================================================

namespace tatooine {

//==============================================================================

auto copy_or_keep_if_rvalue_tensor_solve(dynamic_tensor auto&& x) -> decltype(auto) {

  return tensor<tatooine::value_type<decltype(x)>>{std::forward<decltype(x)>(x)};

}

template <typename T>

auto copy_or_keep_if_rvalue_tensor_solve(tensor<T>&& x) -> decltype(auto) {

  return std::move(x);

}

template <typename T, std::size_t... Dims>

auto copy_or_keep_if_rvalue_tensor_solve(tensor<T, Dims...>&& x) -> decltype(auto) {

  return std::move(x);

}

template <typename T>

auto copy_or_keep_if_rvalue_tensor_solve(tensor<T> const& x) {

  return tensor<T>{x};

}

template <typename T, std::size_t... Dims>

auto copy_or_keep_if_rvalue_tensor_solve(tensor<T, Dims...> const& x) {

  return tensor<T, Dims...>{x};

}

template <fixed_size_quadratic_mat<2> MatA, static_mat MatB>

requires(tensor_dimension<MatB, 0> == 2)

auto constexpr solve_direct(MatA&& A, MatB&& B) {

  using out_value_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<MatB>>;

  auto constexpr K = tensor_dimension<MatB, 1>;


  using out_mat_type = mat<out_value_type, 2, K>;

  using out_type     = std::optional<out_mat_type>;


  auto const div   = (A(0, 0) * A(1, 1) - A(1, 0) * A(0, 1));

  if (div == 0) {

    return out_type{std::nullopt};

  }

  auto const p = 1 / div;

  auto       X = out_type{out_mat_type{}};

  for (std::size_t i = 0; i < K; ++i) {

    X->at(0, i) = -(A(0, 1) * B(1, i) - A(1, 1) * B(0, i)) * p;

    X->at(1, i) = (A(0, 0) * B(1, i) - A(1, 0) * B(0, i)) * p;

  }

  return X;

}

// - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

template <fixed_size_mat<2, 2> MatA, fixed_size_vec<2> VecB>

auto solve_direct(MatA&& A, VecB&& b) -> std::optional<

    vec<common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>, 2>> {

  using out_value_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>;

  auto const div = (A(0, 0) * A(1, 1) - A(1, 0) * A(0, 1));

  if (div == 0) {

    return std::nullopt;

  }

  auto const p = 1 / div;

  return vec<out_value_type, 2>{-(A(0, 1) * b(1) - A(1, 1) * b(0)) * p,

                                (A(0, 0) * b(1) - A(1, 0) * b(0)) * p};

}

//------------------------------------------------------------------------------

template <static_quadratic_mat MatA, static_vec VecB>

requires(tensor_dimension<MatA, 0> ==

         tensor_dimension<VecB, 0>)

auto solve_cramer(MatA const& A, VecB const& b) -> std::optional<

    vec<common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>,

        tensor_dimension<MatA, 1>>> {

  static constexpr auto N = tensor_dimension<MatA, 1>;

  using out_value_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>;

  auto const det_inv = 1 / det(A);

  auto       Y       = mat<out_value_type, N, N>{A};

  auto       tmp     = vec<out_value_type, N>{};

  auto       result  = vec<out_value_type, N>{};

  for (std::size_t i = 0; i < N; ++i) {

    tmp       = Y.col(i);

    Y.col(i)  = b;

    result(i) = det(Y) * det_inv;

    Y.col(i)  = tmp;

  }

  return result;

}

//------------------------------------------------------------------------------

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <static_quadratic_mat MatA, static_vec VecB>

requires(tensor_dimension<MatA, 1> ==

         tensor_dimension<VecB, 0>)

auto solve_lu_lapack(MatA& A_, VecB&& b_)

    -> std::optional<

        tensor<common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>>> {

  using common_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>;

  static constexpr auto M    = tensor_dimension<MatA, 0>;

  static constexpr auto N    = tensor_dimension<MatA, 1>;

  auto                  A    = tensor<common_type, M, N>{A_};

  auto                  b    = tensor<common_type, N>{b_};

  auto                  ipiv = vec<int, N>{};

  [[maybe_unused]] auto info = lapack::gesv(A, b, ipiv);

  if (info != 0) {

    return std::nullopt;

  }

  return b;

}

#endif

// - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <static_quadratic_mat MatA, static_mat MatB>

requires(tensor_dimension<MatA, 0> == tensor_dimension<MatB, 0>)

auto solve_lu_lapack(MatA& A_, MatB& B_)  {

  using out_value_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<MatB>>;

  static constexpr auto N = tensor_dimension<MatA, 1>;

  static constexpr auto K = tensor_dimension<MatB, 1>;

  using out_mat_type         = mat<out_value_type, N, K>;

  using out_type             = std::optional<out_mat_type>;

  auto                  A    = mat<out_value_type, N, N>{A_};

  auto                  B    = out_type{B_};

  auto                  ipiv = vec<int, N>{};

  [[maybe_unused]] auto info = lapack::gesv(A, *B, ipiv);

  if (info != 0) {

    return out_type{std::nullopt};

  }

  return B;

}

#endif

//------------------------------------------------------------------------------

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <static_mat MatA, static_mat MatB>

requires(tensor_dimension<MatA, 0> == tensor_dimension<MatB, 0>)

auto solve_qr_lapack(MatA&& A_, MatB&& B_) {

  using out_value_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<MatB>>;

  static auto constexpr M = tensor_dimension<MatA, 0>;

  static auto constexpr N = tensor_dimension<MatA, 1>;

  static auto constexpr K = tensor_dimension<MatB, 1>;

  using mat_out_type      = mat<out_value_type, N, K>;

  using out_type = std::optional<mat_out_type>;


  auto A   = mat<out_value_type, M, N>{A_};

  auto B   = mat<out_value_type, M, K>{B_};

  auto tau = vec<out_value_type, (M < N ? M : N)>{};


  // Q * R = A

  if (lapack::geqrf(A, tau) != 0) {

    return out_type{std::nullopt};

  }

  // R * x = Q^T * B

  if (lapack::ormqr(A, B, tau, lapack::side::left, lapack::op::transpose) !=

      0) {

    return out_type{std::nullopt};

  }

  // Use back-substitution using the upper right part of A

  if (lapack::trtrs(A, B, lapack::uplo::upper, lapack::op::no_transpose,

                    lapack::diag::non_unit)) {

    return out_type{std::nullopt};

  }

  auto X = out_type{mat_out_type{}};

  for_loop([&, i = std::size_t(0)](

               auto const... is) mutable { X->at(is...) = B(is...); },

           N, K);

  return X;

}

#endif

// - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <static_mat MatA, static_vec VecB>

requires (tensor_dimension<MatA, 0> == tensor_dimension<VecB, 0>)

auto solve_qr_lapack(MatA&& A_, VecB&& b_) {

  using out_value_type =

      common_type<tatooine::value_type<MatA>, tatooine::value_type<VecB>>;

  static auto constexpr M = tensor_dimension<MatA, 0>;

  static auto constexpr N = tensor_dimension<MatA, 1>;

  auto A                  = mat<out_value_type, M, N>{A_};

  auto b                  = vec<out_value_type, M>{b_};

  using out_vec_type      = vec<out_value_type, (M < N ? M : N)>;

  using out_type          = std::optional<out_vec_type>;

  auto tau                = out_type{out_vec_type{}};


  // Q * R = A

  if (lapack::geqrf(A, *tau) != 0) {

    return out_type{std::nullopt};

  }

  // R * x = Q^T * b

  if (lapack::ormqr(A, b, *tau, lapack::side::left, lapack::op::transpose) != 0) {

    return out_type{std::nullopt};

  }

  // Use back-substitution using the upper right part of A

  if (lapack::trtrs(A, b, lapack::uplo::upper, lapack::op::no_transpose,

                lapack::diag::non_unit) != 0) {

    return out_type{std::nullopt};

  }

  for (std::size_t i = 0; i < tau->dimension(0); ++i) {

    tau->at(i) = b(i);

  }

  return tau;

}

#endif

//------------------------------------------------------------------------------

template <static_mat MatA, static_mat MatB>

requires (tensor_dimension<MatA, 0> == tensor_dimension<MatB, 0>)

auto solve(MatA&& A, MatB&& B) {

  static auto constexpr M = tensor_dimension<MatA, 0>;

  static auto constexpr N = tensor_dimension<MatA, 1>;

  static auto constexpr K = tensor_dimension<MatB, 1>;

  if constexpr (M == 2 && N == 2 && K >= M) {

    return solve_direct(std::forward<MatA>(A), std::forward<MatB>(B));

  } else if constexpr (M == N) {

    return solve_lu_lapack(std::forward<MatA>(A), std::forward<MatB>(B));

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

    throw std::runtime_error{

        "cannot do a LU-factorization because LAPACK is missing"};

#endif


  } else if constexpr (M > N) {

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

    return solve_qr_lapack(std::forward<MatA>(A), std::forward<MatB>(B));

#else

    throw std::runtime_error{

        "cannot do a QR-factorization because LAPACK is missing"};

#endif


  } else {

    throw std::runtime_error{"System is under-determined."};

  }

}

//------------------------------------------------------------------------------

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <dynamic_tensor TensorA, dynamic_tensor TensorB>

auto solve_lu_lapack(TensorA&& A_, TensorB&& B_) -> std::optional<tensor<

    common_type<tatooine::value_type<TensorA>, tatooine::value_type<TensorB>>>> {

  assert(A_.rank() == 2);

  assert(A_.dimension(0) == A_.dimension(1));

  assert(A_.dimension(0) == B_.dimension(0));

  assert(B_.rank() == 1 || B_.rank() == 2);

  auto ipiv   = tensor<int>::zeros(A_.dimension(0));

  if constexpr (same_as<tatooine::value_type<TensorA>,

                        tatooine::value_type<TensorB>>) {

    decltype(auto) A =

        copy_or_keep_if_rvalue_tensor_solve(std::forward<TensorA>(A_));

    decltype(auto) B =

        copy_or_keep_if_rvalue_tensor_solve(std::forward<TensorB>(B_));

    if (auto const info = lapack::gesv(A, B, ipiv); info != 0) {

      return std::nullopt;

    }

    return std::forward<decltype(B)>(B);

  } else {

    using out_value_type =

        common_type<tatooine::value_type<TensorA>, tatooine::value_type<TensorB>>;

    auto A = tensor<out_value_type>{A_};

    auto B = tensor<out_value_type>{B_};

    if (lapack::gesv(A, B, ipiv) != 0) {

      return std::nullopt;

    }

    return B;

  }

}

#endif

//------------------------------------------------------------------------------

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <dynamic_tensor TensorA, dynamic_tensor TensorB>

auto solve_qr_lapack(TensorA&& A_, TensorB&& B_)

    -> std::optional<tensor<

        common_type<tatooine::value_type<TensorA>, tatooine::value_type<TensorB>>>> {

  using out_value_type =

      common_type<tatooine::value_type<TensorA>, tatooine::value_type<TensorB>>;

  assert(A_.rank() == 2);

  assert(B_.rank() == 1 || B_.rank() == 2);

  assert(A_.dimension(0) == B_.dimension(0));

  auto A = copy_or_keep_if_rvalue_tensor_solve(A_);

  auto B = copy_or_keep_if_rvalue_tensor_solve(B_);

  auto const M   = A.dimension(0);

  auto const N   = A.dimension(1);

  auto const K   = (B.rank() == 1 ? 1 : B.dimension(1));

  auto       tau = tensor<out_value_type>{min(M, N)};

  auto       X   = K > 1 ? tensor<out_value_type>{N, K} : tensor<out_value_type>{N};


  // Q * R = A

  if (lapack::geqrf(A, tau) != 0) {

    return std::nullopt;

  }

  // R * x = Q^T * B

  if (lapack::ormqr(A, B, tau, lapack::side::left, lapack::op::transpose) !=

      0) {

    return std::nullopt;

  }

  // Use back-substitution using the upper right part of A

  if (lapack::trtrs(A, B, lapack::uplo::upper, lapack::op::no_transpose,

                    lapack::diag::non_unit) != 0) {

    return std::nullopt;

  }

  for_loop(

      [&](auto const i, auto const j) {

        if (B.rank() == 1) {

          X(i) = B(i);

        } else {

          X(i, j) = B(i, j);

        }

      },

      N, K);

  return X;

}

#endif

// - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

template <static_mat MatA, static_vec VecB>

requires (tensor_dimension<MatA, 0> == tensor_dimension<VecB, 0>)

auto solve(MatA&& A, VecB&& b) {

  static auto constexpr M = tensor_dimension<MatA, 0>;

  static auto constexpr N = tensor_dimension<MatA, 1>;

  if constexpr (M == 2 && N == 2) {

    return solve_direct(std::forward<MatA>(A), std::forward<VecB>(b));

  } else if constexpr (M == 3 && N == 3) {

    return solve_cramer(std::forward<MatA>(A), std::forward<VecB>(b));

  } else if constexpr (M == N) {

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

    return solve_lu_lapack(std::forward<MatA>(A), std::forward<VecB>(b));

#else

    throw std::runtime_error{

        "cannot do a LU-factorization because LAPACK is missing"};

#endif

  } else if constexpr (M > N) {

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

    return solve_qr_lapack(std::forward<MatA>(A), std::forward<VecB>(b));

#else

    throw std::runtime_error{

        "cannot do a QR-factorization because LAPACK is missing"};

#endif

  } else {

    throw std::runtime_error{"System is under-determined."};

  }

}

//==============================================================================

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

template <dynamic_tensor TensorA, dynamic_tensor TensorB>

auto solve_symmetric_lapack(TensorA&& A_, TensorB&& B_,

                            lapack::uplo uplo = lapack::uplo::lower)

    -> std::optional<tensor<common_type<tatooine::value_type<decltype(A_)>,

                                        tatooine::value_type<decltype(B_)>>>> {

  // assert A is quadratic matrix

  assert(A_.rank() == 2);

  assert(A_.dimension(0) == A_.dimension(1));


  // assert B is vector or matrix

  assert(B_.rank() == 1 || B_.rank() == 2);

  // assert B dimensions are correct

  assert(B_.dimension(0) == A_.dimension(0));

  if constexpr (same_as<tatooine::value_type<decltype(A_)>,

                        tatooine::value_type<decltype(B_)>>) {

    decltype(auto) A = copy_or_keep_if_rvalue_tensor_solve(A_);

    decltype(auto) B = copy_or_keep_if_rvalue_tensor_solve(B_);


    auto const info = lapack::sysv(A, B, uplo);

    if (info > 0) {

      std::cerr

          << "[lapack::sysv]\n  D(" << info << ", " << info

          << ") is exactly zero. The factorization has been completed, but the "

             "block diagonal matrix D is exactly singular, so the solution "

             "could "

             "not be computed.\n";

    } else if (info < 0) {

      std::cerr << "[lapack::sysv]\n  Parameter " << -info << " is wrong.\n";

    }

    if (info != 0) {

      return std::nullopt;

    }

    return std::forward<decltype(B)>(B);

  } else {

    using T = common_type<tatooine::value_type<decltype(A_)>,

                          tatooine::value_type<decltype(B_)>>;

    auto A = tensor<T>{A_};

    auto B = tensor<T>{B_};


    auto const info = lapack::sysv(A, B, uplo);

    if (info > 0) {

      std::cerr

          << "[lapack::sysv]\n  D(" << info << ", " << info

          << ") is exactly zero. The factorization has been completed, but the "

             "block diagonal matrix D is exactly singular, so the solution "

             "could "

             "not be computed.\n";

    } else if (info < 0) {

      std::cerr << "[lapack::sysv]\n  Parameter " << -info << " is wrong.\n";

    }

    if (info != 0) {

      return std::nullopt;

    }

    return B;

  }

}

#endif

//==============================================================================

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

//auto solve_symmetric_lapack_aa(dynamic_tensor auto&& A_, dynamic_tensor auto&& B_,

//                            lapack::uplo uplo = lapack::uplo::lower)

//    -> std::optional<tensor<common_type<tatooine::value_type<decltype(A_)>,

//                                        tatooine::value_type<decltype(B_)>>>> {

//  // assert A is quadratic matrix

//  assert(A_.rank() == 2);

//  assert(A_.dimension(0) == A_.dimension(1));

//

//  // assert B is vector or matrix

//  assert(B_.rank() == 1 || B_.rank() == 2);

//  // assert B dimensions are correct

//  assert(B_.dimension(0) == A_.dimension(0));

//  if constexpr (same_as<tatooine::value_type<decltype(A_)>,

//                        tatooine::value_type<decltype(B_)>>) {

//    decltype(auto) A = copy_or_keep_if_rvalue_tensor_solve(A_);

//    decltype(auto) B = copy_or_keep_if_rvalue_tensor_solve(B_);

//

//    auto const info = lapack::sysv_aa(A, B, uplo);

//    if (info > 0) {

//      std::cerr

//          << "[lapack::sysv_aa]\n  D(" << info << ", " << info

//          << ") is exactly zero. The factorization has been completed, but the "

//             "block diagonal matrix D is exactly singular, so the solution "

//             "could "

//             "not be computed.\n";

//    } else if (info < 0) {

//      std::cerr << "[lapack::sysv_aa]\n  Parameter " << -info << " is wrong.\n";

//    }

//    if (info != 0) {

//      return std::nullopt;

//    }

//    return std::forward<decltype(B)>(B);

//  } else {

//    using T = common_type<tatooine::value_type<decltype(A_)>,

//                          tatooine::value_type<decltype(B_)>>;

//    auto A = tensor<T>{A_};

//    auto B = tensor<T>{B_};

//

//    auto const info = lapack::sysv_aa(A, B, uplo);

//    if (info > 0) {

//      std::cerr

//          << "[lapack::sysv_aa]\n  D(" << info << ", " << info

//          << ") is exactly zero. The factorization has been completed, but the "

//             "block diagonal matrix D is exactly singular, so the solution "

//             "could "

//             "not be computed.\n";

//    } else if (info < 0) {

//      std::cerr << "[lapack::sysv_aa]\n  Parameter " << -info << " is wrong.\n";

//    }

//    if (info != 0) {

//      return std::nullopt;

//    }

//    return B;

//  }

//}

#endif

//==============================================================================

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

//auto solve_symmetric_lapack_rk(dynamic_tensor auto&& A_,

//                               dynamic_tensor auto&& B_,

//                               lapack::uplo          uplo = lapack::uplo::lower)

//    -> std::optional<tensor<common_type<tatooine::value_type<decltype(A_)>,

//                                        tatooine::value_type<decltype(B_)>>>> {

//  // assert A is quadratic matrix

//  assert(A_.rank() == 2);

//  assert(A_.dimension(0) == A_.dimension(1));

//

//  // assert B is vector or matrix

//  assert(B_.rank() == 1 || B_.rank() == 2);

//  // assert B dimensions are correct

//  assert(B_.dimension(0) == A_.dimension(0));

//  if constexpr (same_as<tatooine::value_type<decltype(A_)>,

//                        tatooine::value_type<decltype(B_)>>) {

//    decltype(auto) A = copy_or_keep_if_rvalue_tensor_solve(A_);

//    decltype(auto) B = copy_or_keep_if_rvalue_tensor_solve(B_);

//

//    auto const info = lapack::sysv_rk(A, B, uplo);

//    if (info > 0) {

//      std::cerr

//          << "[lapack::sysv_rk]\n  D(" << info << ", " << info

//          << ") is exactly zero. The factorization has been completed, but the "

//             "block diagonal matrix D is exactly singular, so the solution "

//             "could "

//             "not be computed.\n";

//    } else if (info < 0) {

//      std::cerr << "[lapack::sysv_rk]\n  Parameter " << -info << " is wrong.\n";

//    }

//    if (info != 0) {

//      return std::nullopt;

//    }

//    return std::forward<decltype(B)>(B);

//  } else {

//    using T = common_type<tatooine::value_type<decltype(A_)>,

//                          tatooine::value_type<decltype(B_)>>;

//    auto A = tensor<T>{A_};

//    auto B = tensor<T>{B_};

//

//    auto const info = lapack::sysv_rk(A, B, uplo);

//    if (info > 0) {

//      std::cerr

//          << "[lapack::sysv_rk]\n  D(" << info << ", " << info

//          << ") is exactly zero. The factorization has been completed, but the "

//             "block diagonal matrix D is exactly singular, so the solution "

//             "could "

//             "not be computed.\n";

//    } else if (info < 0) {

//      std::cerr << "[lapack::sysv_rk]\n  Parameter " << -info << " is wrong.\n";

//    }

//    if (info != 0) {

//      return std::nullopt;

//    }

//    return B;

//  }

//}

#endif

//------------------------------------------------------------------------------

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

auto solve_symmetric(dynamic_tensor auto&& A, dynamic_tensor auto&& B) {

  return solve_symmetric_lapack(std::forward<decltype(A)>(A),

                                std::forward<decltype(B)>(B));

}

#endif

//------------------------------------------------------------------------------

template <dynamic_tensor TensorA, dynamic_tensor TensorB>

auto solve(TensorA&& A, TensorB&& B) -> std::optional<tensor<

    common_type<tatooine::value_type<TensorB>, tatooine::value_type<TensorB>>>> {

  assert(A.rank() == 2);

  assert(B.rank() == 1 || B.rank() == 2);

  assert(B.dimension(0) == A.dimension(0));

  auto const M = A.dimension(0);

  auto const N = A.dimension(1);

  if (M == N) {

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

    return solve_lu_lapack(std::forward<decltype(A)>(A),

                           std::forward<decltype(B)>(B));

#else

    throw std::runtime_error{

        "cannot do a LU-factorization because LAPACK is missing"};

#endif

  } else if (M > N) {

#if TATOOINE_BLAS_AND_LAPACK_AVAILABLE

    return solve_qr_lapack(std::forward<decltype(A)>(A),

                           std::forward<decltype(B)>(B));

#else

    throw std::runtime_error{

        "cannot do a QR-factorization because LAPACK is missing"};

#endif

  }

  throw std::runtime_error{"System is under-determined."};

}

//==============================================================================

}  // namespace tatooine

//==============================================================================

#endif

tatooine::dynamic_tensor
Definition: tensor_concepts.h:17

tatooine::same_as
Definition: concepts.h:15

determinant.h

tatooine::lapack::gesv
auto gesv(int N, int NRHS, Float *A, int LDA, int *IPIV, Float *B, int LDB) -> int
Definition: gesv.h:38

tatooine::lapack::sysv
auto sysv(uplo u, int N, int NRHS, Float *A, int LDA, int *IPIV, Float *B, int LDB, Float *WORK, int LWORK) -> int
Definition: sysv.h:39

utility.h

tatooine::blas::uplo::upper
@ upper

tatooine::blas::uplo::lower
@ lower

tatooine::blas::diag::non_unit
@ non_unit

tatooine::blas::op::transpose
@ transpose

tatooine::blas::op::no_transpose
@ no_transpose

tatooine::lapack::geqrf
auto geqrf(int M, int N, Float *A, int LDA, Float *TAU, Float *WORK, int LWORK) -> int
Definition: geqrf.h:18

tatooine::lapack::trtrs
auto trtrs(uplo u, op t, diag d, int N, int NRHS, Float *A, int LDA, Float *B, int LDB) -> int
Definition: trtrs.h:18

tatooine::lapack::ormqr
auto ormqr(side SIDE, op TRANS, int M, int N, int K, Float *A, int LDA, Float *TAU, Float *C, int LDC, Float *WORK, int LWORK) -> int
Definition: ormqr.h:21

tatooine
Definition: algorithm.h:6

tatooine::solve_symmetric
auto solve_symmetric(dynamic_tensor auto &&A, dynamic_tensor auto &&B)
Definition: solve.h:549

tatooine::common_type
typename common_type_impl< Ts... >::type common_type
Definition: common_type.h:23

tatooine::copy_or_keep_if_rvalue_tensor_solve
auto copy_or_keep_if_rvalue_tensor_solve(dynamic_tensor auto &&x) -> decltype(auto)
Definition: solve.h:12

tatooine::solve_direct
auto constexpr solve_direct(MatA &&A, MatB &&B)
Definition: solve.h:33

tatooine::value_type
typename value_type_impl< T >::type value_type
Definition: type_traits.h:280

tatooine::solve_symmetric_lapack
auto solve_symmetric_lapack(TensorA &&A_, TensorB &&B_, lapack::uplo uplo=lapack::uplo::lower) -> std::optional< tensor< common_type< tatooine::value_type< decltype(A_)>, tatooine::value_type< decltype(B_)> > > >
Definition: solve.h:349

tatooine::solve
auto solve(polynomial< Real, 1 > const &p) -> std::vector< Real >
solve a + b*x
Definition: polynomial.h:187

tatooine::solve_lu_lapack
auto solve_lu_lapack(MatA &A_, VecB &&b_) -> std::optional< tensor< common_type< tatooine::value_type< MatA >, tatooine::value_type< VecB > > > >
Definition: solve.h:94

tatooine::solve_qr_lapack
auto solve_qr_lapack(MatA &&A_, MatB &&B_)
Definition: solve.h:136

tatooine::min
constexpr auto min(A &&a, B &&b)
Definition: math.h:15

tatooine::for_loop
constexpr auto for_loop(Iteration &&iteration, execution_policy::sequential_t, Ranges(&&... ranges)[2]) -> void
Use this function for creating a sequential nested loop.
Definition: for_loop.h:336

tatooine::det
constexpr auto det(base_tensor< Tensor, T, 2, 2 > const &A) -> T
Definition: determinant.h:7

tatooine::solve_cramer
auto solve_cramer(MatA const &A, VecB const &b) -> std::optional< vec< common_type< tatooine::value_type< MatA >, tatooine::value_type< VecB > >, tensor_dimension< MatA, 1 > > >
Definition: solve.h:71

tatooine::base_uniform_tree_hierarchy::dim::left
@ left
Definition: uniform_tree_hierarchy.h:18

tatooine::mat
Definition: mat.h:14

tatooine::tensor
Definition: tensor.h:17

tatooine::tensor::zeros
static constexpr auto zeros()
Definition: tensor.h:144

tatooine::vec
Definition: vec.h:12

tensor_concepts.h