/*
 * Shorthand accessors: A(m,n) and C(m,n) expand to BLKADDR() applied to the
 * identifiers A and C respectively, with element type PLASMA_Complex64_t and
 * the two indices passed through unchanged.
 *
 * The identifiers A and C are not macro parameters, so each macro relies on a
 * variable of that name being in scope at the point of use.
 * NOTE(review): BLKADDR is defined outside this excerpt; presumably (m,n) are
 * tile row/column indices and the result is the tile's address - confirm
 * against the BLKADDR definition.
 */
18 #define A(m,n) BLKADDR(A, PLASMA_Complex64_t, m, n)
19 #define C(m,n) BLKADDR(C, PLASMA_Complex64_t, m, n)
37 int ldam, ldan, ldak, ldcm, ldcn;
38 int tempkn, tempkm, tempmm, tempnn;
49 while (m >= C.
mt && n < C.
nt) {
57 while (next_m >= C.
mt && next_n < C.
nt) {
59 next_m = next_m - C.
mt + next_n;
62 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
63 tempnn = n == C.
nt-1 ? C.
n-n*C.
nb : C.
nb;
72 for (k = 0; k < A.
nt; k++) {
73 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
74 zbeta = k == 0 ? beta : zone;
79 zbeta,
C(m, n), ldcm);
86 for (k = 0; k < A.
mt; k++) {
87 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
89 zbeta = k == 0 ? beta : zone;
94 zbeta,
C(m, n), ldcm);
107 for (k = 0; k < A.
nt; k++) {
108 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
109 zbeta = k == 0 ? beta : zone;
112 tempmm, tempnn, tempkn,
113 alpha,
A(m, k), ldam,
115 zbeta,
C(m, n), ldcm);
123 for (k = 0; k < A.
nt; k++) {
124 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
125 zbeta = k == 0 ? beta : zone;
128 tempnn, tempmm, tempkn,
129 alpha,
A(n, k), ldan,
131 zbeta,
C(n, m), ldcn);
141 for (k = 0; k < A.
mt; k++) {
142 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
144 zbeta = k == 0 ? beta : zone;
147 tempmm, tempnn, tempkm,
148 alpha,
A(k, m), ldak,
150 zbeta,
C(m, n), ldcm);
158 for (k = 0; k < A.
mt; k++) {
159 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
161 zbeta = k == 0 ? beta : zone;
164 tempnn, tempmm, tempkm,
165 alpha,
A(k, n), ldak,
167 zbeta,
C(n, m), ldcn);
189 int ldak, ldam, ldan, ldcm, ldcn;
190 int tempnn, tempmm, tempkn, tempkm;
200 for (n = 0; n < C.
nt; n++) {
201 tempnn = n == C.
nt-1 ? C.
n-n*C.
nb : C.
nb;
208 for (k = 0; k < A.
nt; k++) {
209 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
210 zbeta = k == 0 ? beta : zone;
212 plasma->
quark, &task_flags,
214 tempnn, tempkn, A.
mb,
215 alpha, A(n, k), ldan,
216 zbeta,
C(n, n), ldcn);
222 for (m = n+1; m < C.
mt; m++) {
223 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
226 for (k = 0; k < A.
nt; k++) {
227 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
228 zbeta = k == 0 ? beta : zone;
230 plasma->
quark, &task_flags,
232 tempmm, tempnn, tempkn, A.
mb,
233 alpha, A(m, k), ldam,
235 zbeta,
C(m, n), ldcm);
243 for (m = n+1; m < C.
mt; m++) {
244 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
246 for (k = 0; k < A.
nt; k++) {
247 tempkn = k == A.
nt-1 ? A.
n-k*A.
nb : A.
nb;
248 zbeta = k == 0 ? beta : zone;
250 plasma->
quark, &task_flags,
252 tempnn, tempmm, tempkn, A.
mb,
253 alpha, A(n, k), ldan,
255 zbeta,
C(n, m), ldcn);
264 for (k = 0; k < A.
mt; k++) {
265 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
267 zbeta = k == 0 ? beta : zone;
269 plasma->
quark, &task_flags,
271 tempnn, tempkm, A.
mb,
272 alpha, A(k, n), ldak,
273 zbeta,
C(n, n), ldcn);
279 for (m = n+1; m < C.
mt; m++) {
280 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
282 for (k = 0; k < A.
mt; k++) {
283 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
285 zbeta = k == 0 ? beta : zone;
287 plasma->
quark, &task_flags,
289 tempmm, tempnn, tempkm, A.
mb,
290 alpha, A(k, m), ldak,
292 zbeta,
C(m, n), ldcm);
300 for (m = n+1; m < C.
mt; m++) {
301 tempmm = m == C.
mt-1 ? C.
m-m*C.
mb : C.
mb;
302 for (k = 0; k < A.
mt; k++) {
303 tempkm = k == A.
mt-1 ? A.
m-k*A.
mb : A.
mb;
305 zbeta = k == 0 ? beta : zone;
307 plasma->
quark, &task_flags,
309 tempnn, tempmm, tempkm, A.
mb,
310 alpha, A(k, n), ldak,
312 zbeta,
C(n, m), ldcn);