#include "relapack.h" static void RELAPACK_clauum_rec(const char *, const blasint *, float *, const blasint *, blasint *); /** CLAUUM computes the product U * U**H or L**H * L, where the triangular factor U or L is stored in the upper or lower triangular part of the array A. * * This routine is functionally equivalent to LAPACK's clauum. * For details on its interface, see * http://www.netlib.org/lapack/explore-html/d2/d36/clauum_8f.html * */ void RELAPACK_clauum( const char *uplo, const blasint *n, float *A, const blasint *ldA, blasint *info ) { // Check arguments const blasint lower = LAPACK(lsame)(uplo, "L"); const blasint upper = LAPACK(lsame)(uplo, "U"); *info = 0; if (!lower && !upper) *info = -1; else if (*n < 0) *info = -2; else if (*ldA < MAX(1, *n)) *info = -4; if (*info) { const blasint minfo = -*info; LAPACK(xerbla)("CLAUUM", &minfo, strlen("CLAUUM")); return; } if (*n == 0) return; // Clean char * arguments const char cleanuplo = lower ? 'L' : 'U'; // Recursive kernel RELAPACK_clauum_rec(&cleanuplo, n, A, ldA, info); } /** clauum's recursive compute kernel */ static void RELAPACK_clauum_rec( const char *uplo, const blasint *n, float *A, const blasint *ldA, blasint *info ) { if (*n <= MAX(CROSSOVER_CLAUUM, 1)) { // Unblocked LAPACK(clauu2)(uplo, n, A, ldA, info); return; } // Constants const float ONE[] = { 1., 0. }; // Splitting const blasint n1 = CREC_SPLIT(*n); const blasint n2 = *n - n1; // A_TL A_TR // A_BL A_BR float *const A_TL = A; float *const A_TR = A + 2 * *ldA * n1; float *const A_BL = A + 2 * n1; float *const A_BR = A + 2 * *ldA * n1 + 2 * n1; // recursion(A_TL) RELAPACK_clauum_rec(uplo, &n1, A_TL, ldA, info); if (*uplo == 'L') { // A_TL = A_TL + A_BL' * A_BL BLAS(cherk)("L", "C", &n1, &n2, ONE, A_BL, ldA, ONE, A_TL, ldA); // A_BL = A_BR' * A_BL BLAS(ctrmm)("L", "L", "C", "N", &n2, &n1, ONE, A_BR, ldA, A_BL, ldA); } else { // A_TL = A_TL + A_TR * A_TR' BLAS(cherk)("U", "N", &n1, &n2, ONE, A_TR, ldA, ONE, A_TL, ldA); // A_TR = A_TR * A_BR' BLAS(ctrmm)("R", "U", "C", "N", &n1, &n2, ONE, A_BR, ldA, A_TR, ldA); } // recursion(A_BR) RELAPACK_clauum_rec(uplo, &n2, A_BR, ldA, info); }