/*
 * Tile-access shorthands used by the loops below.
 * A(m,n) and C(m,n) forward the tile indices (m, n) to BLKADDR together
 * with the object named A (resp. C) from the enclosing scope and the
 * element type PLASMA_Complex64_t.  Call sites pass the result as a matrix
 * operand immediately followed by a leading dimension (e.g. "A(m, k), ldam").
 * NOTE(review): BLKADDR is defined outside this view; presumably it yields
 * the address of tile (m, n) -- confirm against its definition.
 */
17 #define A(m,n) BLKADDR(A, PLASMA_Complex64_t, m, n)
18 #define C(m,n) BLKADDR(C, PLASMA_Complex64_t, m, n)
36 int ldam, ldan, ldak, ldcm, ldcn;
37 int tempkn, tempkm, tempmm, tempnn;
51 while (m >= C.
mt && n < C.
nt) {
59 while (next_m >= C.
mt && next_n < C.
nt) {
61 next_m = next_m - C.
mt + next_n;
64 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
65 tempnn = n == C.
nt-1 ? C.
n-n*C.
nb : C.
nb;
74 for (k = 0; k < A.
nt; k++) {
75 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
76 dbeta = k == 0 ? beta : 1.0;
81 dbeta,
C(m, n), ldcm);
88 for (k = 0; k < A.
mt; k++) {
89 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
91 dbeta = k == 0 ? beta : 1.0;
96 dbeta,
C(m, n), ldcm);
109 for (k = 0; k < A.
nt; k++) {
110 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
114 tempmm, tempnn, tempkn,
115 zalpha,
A(m, k), ldam,
117 zbeta,
C(m, n), ldcm);
125 for (k = 0; k < A.
nt; k++) {
126 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
130 tempnn, tempmm, tempkn,
131 zalpha,
A(n, k), ldan,
133 zbeta,
C(n, m), ldcn);
143 for (k = 0; k < A.
mt; k++) {
144 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
149 tempmm, tempnn, tempkm,
150 zalpha,
A(k, m), ldak,
152 zbeta,
C(m, n), ldcm);
160 for (k = 0; k < A.
mt; k++) {
161 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
166 tempnn, tempmm, tempkm,
167 zalpha,
A(k, n), ldak,
169 zbeta,
C(n, m), ldcn);
191 int ldak, ldam, ldan, ldcm, ldcn;
192 int tempnn, tempmm, tempkn, tempkm;
204 for (n = 0; n < C.
nt; n++) {
205 tempnn = n == C.
nt-1 ? C.
n-n*C.
nb : C.
nb;
212 for (k = 0; k < A.
nt; k++) {
213 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
214 dbeta = k == 0 ? beta : 1.0;
216 plasma->
quark, &task_flags,
218 tempnn, tempkn, A.
mb,
219 alpha, A(n, k), ldan,
220 dbeta,
C(n, n), ldcn);
226 for (m = n+1; m < C.
mt; m++) {
227 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
230 for (k = 0; k < A.
nt; k++) {
231 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
234 plasma->
quark, &task_flags,
236 tempmm, tempnn, tempkn, A.
mb,
237 zalpha, A(m, k), ldam,
239 zbeta,
C(m, n), ldcm);
247 for (m = n+1; m < C.
mt; m++) {
248 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
250 for (k = 0; k < A.
nt; k++) {
251 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
254 plasma->
quark, &task_flags,
256 tempnn, tempmm, tempkn, A.
mb,
257 zalpha, A(n, k), ldan,
259 zbeta,
C(n, m), ldcn);
268 for (k = 0; k < A.
mt; k++) {
269 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
271 dbeta = k == 0 ? beta : 1.0;
273 plasma->
quark, &task_flags,
275 tempnn, tempkm, A.
mb,
276 alpha, A(k, n), ldak,
277 dbeta,
C(n, n), ldcn);
283 for (m = n+1; m < C.
mt; m++) {
284 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
286 for (k = 0; k < A.
mt; k++) {
287 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
291 plasma->
quark, &task_flags,
293 tempmm, tempnn, tempkm, A.
mb,
294 zalpha, A(k, m), ldak,
296 zbeta,
C(m, n), ldcm);
304 for (m = n+1; m < C.
mt; m++) {
305 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
306 for (k = 0; k < A.
mt; k++) {
307 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
311 plasma->
quark, &task_flags,
313 tempnn, tempmm, tempkm, A.
mb,
314 zalpha, A(k, n), ldak,
316 zbeta,
C(n, m), ldcn);