/*
 * Accessor macros: each one forwards a descriptor name (A, Q or T), the
 * element type PLASMA_Complex32_t and the parenthesized indices (m, n) to
 * BLKADDR. BLKADDR is defined outside this chunk; presumably it yields the
 * address of block/tile (m, n) of the named descriptor -- TODO confirm.
 */
19 #define A(m,n) BLKADDR(A, PLASMA_Complex32_t, (m), (n))
20 #define Q(m,n) BLKADDR(Q, PLASMA_Complex32_t, (m), (n))
21 #define T(m,n) BLKADDR(T, PLASMA_Complex32_t, (m), (n))
/*
 * Same descriptor T as the macro above, but the second index is offset by
 * A.nt. Inside the expansion, A is not followed by '(' so it is not
 * re-expanded as the function-like macro A(m,n); it refers to the variable
 * named A that must be in scope at the point of use.
 * NOTE(review): looks like this addresses a second set of T blocks stored
 * after the first A.nt columns -- confirm against the T allocation.
 */
22 #define T2(m,n) BLKADDR(T, PLASMA_Complex32_t, (m), (n)+(A.nt))
36 int ldaM, ldam, ldaMRD;
37 int ldbM, ldbm, ldbMRD;
38 int tempkn, tempMm, tempnn, tempmm, tempMRDm, tempkmin;
48 for (k = K-1; k >= 0; k--) {
49 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
51 for (RD = BS; RD < A.
mt-k; RD *= 2)
53 for (RD = lastRD; RD >= BS; RD /= 2) {
54 for (M = k; M+RD < A.
mt; M += 2*RD) {
55 tempMRDm = M+RD == A.
mt-1 ? A.
m-(M+RD)*A.
mb : A.
mb;
59 for (n = 0; n < Q.
nt; n++) {
60 tempnn = n == Q.
nt-1 ? Q.
n-n*Q.
nb : Q.
nb;
62 plasma->
quark, &task_flags,
64 A.
nb, tempnn, tempMRDm, tempnn,
73 for (M = k; M < A.
mt; M += BS) {
74 tempMm = M == A.
mt-1 ? A.
m-M*A.
mb : A.
mb;
75 tempkmin =
min(tempMm, tempkn);
78 for (m =
min(M+BS, A.
mt)-1; m > M; m--) {
79 tempmm = m == A.
mt-1 ? A.
m-m*A.
mb : A.
mb;
83 for (n = 0; n < Q.
nt; n++) {
84 tempnn = n == Q.
nt-1 ? Q.
n-n*Q.
nb : Q.
nb;
86 plasma->
quark, &task_flags,
88 A.
nb, tempnn, tempmm, tempnn,
96 for (n = 0; n < Q.
nt; n++) {
97 tempnn = n == Q.
nt-1 ? Q.
n-n*Q.
nb : Q.
nb;
99 plasma->
quark, &task_flags,