/*
 * Tile accessor shorthands: A(m,n), B(m,n) and C(m,n) forward the tile
 * indices (m, n) to BLKADDR together with the identically named descriptor
 * variable and the element type PLASMA_Complex64_t.
 * Presumably the result is the address of tile (m, n) of that matrix --
 * confirm against the definition of BLKADDR, which is not visible here.
 *
 * Each macro deliberately shares its name with the descriptor it wraps:
 *  - inside the expansion the name is not re-expanded (a macro is never
 *    expanded recursively), so the first BLKADDR argument is the plain
 *    identifier A / B / C;
 *  - member accesses such as A.nt or C.mb are unaffected, because a
 *    function-like macro is only expanded when followed by '('.
 */
17 #define A(m,n) BLKADDR(A, PLASMA_Complex64_t, m, n)
18 #define B(m,n) BLKADDR(B, PLASMA_Complex64_t, m, n)
19 #define C(m,n) BLKADDR(C, PLASMA_Complex64_t, m, n)
41 int tempkn, tempkm, tempmm, tempnn;
52 while (m >= C.
mt && n < C.
nt) {
60 while (next_m >= C.
mt && next_n < C.
nt) {
62 next_m = next_m - C.
mt + next_n;
65 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
66 tempnn = n == C.
nt-1 ? C.
n-n*C.
nb : C.
nb;
78 for (k = 0; k < A.
nt; k++) {
79 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
80 zbeta = k == 0 ? beta : zone;
86 zbeta,
C(m, m), ldcm);
93 for (k = 0; k < A.
mt; k++) {
94 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
97 zbeta = k == 0 ? beta : zone;
101 alpha,
A(k, m), ldak,
103 zbeta,
C(m, m), ldcm);
117 for (k = 0; k < A.
nt; k++) {
118 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
119 zbeta = k == 0 ? beta : zone;
122 tempmm, tempnn, tempkn,
123 alpha,
A(m, k), ldam,
125 zbeta,
C(m, n), ldcm);
129 tempmm, tempnn, tempkn,
130 alpha,
B(m, k), ldbm,
132 zone,
C(m, n), ldcm);
139 for (k = 0; k < A.
nt; k++) {
140 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
141 zbeta = k == 0 ? beta : zone;
144 tempnn, tempmm, tempkn,
145 alpha,
A(n, k), ldan,
147 zbeta,
C(n, m), ldcn);
151 tempnn, tempmm, tempkn,
152 alpha,
B(n, k), ldbn,
154 zone,
C(n, m), ldcn);
163 for (k = 0; k < A.
mt; k++) {
166 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
167 zbeta = k == 0 ? beta : zone;
170 tempmm, tempnn, tempkm,
171 alpha,
A(k, m), ldak,
173 zbeta,
C(m, n), ldcm);
177 tempmm, tempnn, tempkm,
178 alpha,
B(k, m), ldbk,
180 zone,
C(m, n), ldcm);
187 for (k = 0; k < A.
mt; k++) {
188 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
191 zbeta = k == 0 ? beta : zone;
194 tempnn, tempmm, tempkm,
195 alpha,
A(k, n), ldak,
197 zbeta,
/* NOTE(review): C(n, m) is paired with ldcm here, whereas every other
 * C(n, m) argument visible in this listing -- including the next call on
 * the same tile -- is paired with ldcn. This looks like it should be ldcn;
 * confirm against the full source before changing. */
C(n, m), ldcm);
201 tempnn, tempmm, tempkm,
202 alpha,
B(k, n), ldbk,
204 zone,
C(n, m), ldcn);
226 int ldak, ldam, ldan, ldcm, ldcn;
227 int ldbk, ldbm, ldbn;
228 int tempnn, tempmm, tempkn, tempkm;
238 for (n = 0; n < C.
nt; n++) {
239 tempnn = n == C.
nt-1 ? C.
n-n*C.
nb : C.
nb;
247 for (k = 0; k < A.
nt; k++) {
248 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
249 zbeta = k == 0 ? beta : zone;
251 plasma->
quark, &task_flags,
253 tempnn, tempkn, A.
mb,
254 alpha, A(n, k), ldan,
256 zbeta,
C(n, n), ldcn);
262 for (m = n+1; m < C.
mt; m++) {
263 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
267 for (k = 0; k < A.
nt; k++) {
268 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
269 zbeta = k == 0 ? beta : zone;
271 plasma->
quark, &task_flags,
273 tempmm, tempnn, tempkn, A.
mb,
274 alpha, A(m, k), ldam,
276 zbeta,
C(m, n), ldcm);
279 plasma->
quark, &task_flags,
281 tempmm, tempnn, tempkn, A.
mb,
282 alpha, B(m, k), ldbm,
284 zone,
C(m, n), ldcm);
292 for (m = n+1; m < C.
mt; m++) {
293 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
296 for (k = 0; k < A.
nt; k++) {
297 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
298 zbeta = k == 0 ? beta : zone;
300 plasma->
quark, &task_flags,
302 tempnn, tempmm, tempkn, A.
mb,
303 alpha, A(n, k), ldan,
305 zbeta,
C(n, m), ldcn);
308 plasma->
quark, &task_flags,
310 tempnn, tempmm, tempkn, A.
mb,
/* NOTE(review): B(n, k) is paired with ldan (a leading dimension named
 * after A) here. The other B(n, k) argument visible in this listing uses
 * ldbn, and an ldbn variable is declared next to ldbk/ldbm. This looks like
 * it should be ldbn; confirm against the full source before changing. */
311 alpha, B(n, k), ldan,
313 zone,
C(n, m), ldcn);
322 for (k = 0; k < A.
mt; k++) {
323 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
326 zbeta = k == 0 ? beta : zone;
328 plasma->
quark, &task_flags,
330 tempnn, tempkm, A.
mb,
331 alpha, A(k, n), ldak,
333 zbeta,
C(n, n), ldcn);
339 for (m = n+1; m < C.
mt; m++) {
340 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
342 for (k = 0; k < A.
mt; k++) {
343 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
346 zbeta = k == 0 ? beta : zone;
348 plasma->
quark, &task_flags,
350 tempmm, tempnn, tempkm, A.
mb,
351 alpha, A(k, m), ldak,
353 zbeta,
C(m, n), ldcm);
356 plasma->
quark, &task_flags,
358 tempmm, tempnn, tempkm, A.
mb,
359 alpha, B(k, m), ldbk,
361 zone,
C(m, n), ldcm);
369 for (m = n+1; m < C.
mt; m++) {
370 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
371 for (k = 0; k < A.
mt; k++) {
372 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
375 zbeta = k == 0 ? beta : zone;
377 plasma->
quark, &task_flags,
379 tempnn, tempmm, tempkm, A.
mb,
380 alpha, A(k, n), ldak,
382 zbeta,
C(n, m), ldcn);
385 plasma->
quark, &task_flags,
387 tempnn, tempmm, tempkm, A.
mb,
388 alpha, B(k, n), ldbk,
390 zone,
C(n, m), ldcn);