PLASMA  2.7.0
PLASMA - Parallel Linear Algebra for Scalable Multi-core Architectures
 All Data Structures Functions Variables Modules
core_sblas.h
1 
18 #ifndef _PLASMA_CORE_SBLAS_H_
19 #define _PLASMA_CORE_SBLAS_H_
20 
/*
 * Precision selector for this header: the real, single-precision (float)
 * variant of the core kernel prototypes.
 * COMPLEX is not defined by this header, so the `#ifdef COMPLEX` sections
 * further down are compiled out and the `#ifndef COMPLEX` sections are kept,
 * unless COMPLEX has been defined elsewhere before this point.
 */
21 #define REAL
22 
23 #ifdef __cplusplus
24 extern "C" {
25 #endif
26 
30 void CORE_sasum(int storev, PLASMA_enum uplo, int M, int N,
31  const float *A, int lda, float *work);
32 void CORE_sbrdalg1( PLASMA_enum uplo,
33  int n,
34  int nb,
35  float *A,
36  int lda,
37  float *VQ,
38  float *TAUQ,
39  float *VP,
40  float *TAUP,
41  int Vblksiz, int wantz,
42  int i, int sweepid, int m, int grsiz,
43  float *work);
44 int CORE_sgbelr(PLASMA_enum uplo, int N,
45  PLASMA_desc *A, float *V, float *TAU,
46  int st, int ed, int eltsize);
47 int CORE_sgbrce(PLASMA_enum uplo, int N,
48  PLASMA_desc *A, float *V, float *TAU,
49  int st, int ed, int eltsize);
50 int CORE_sgblrx(PLASMA_enum uplo, int N,
51  PLASMA_desc *A, float *V, float *TAU,
52  int st, int ed, int eltsize);
53 int CORE_sgeadd(int M, int N, float alpha,
54  const float *A, int LDA,
55  float *B, int LDB);
56 int CORE_sgelqt(int M, int N, int IB,
57  float *A, int LDA,
58  float *T, int LDT,
59  float *TAU,
60  float *WORK);
61 void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB,
62  int M, int N, int K,
63  float alpha, const float *A, int LDA,
64  const float *B, int LDB,
65  float beta, float *C, int LDC);
66 void CORE_sgemv(PLASMA_enum trans, int M, int N,
67  float alpha, const float *A, int LDA,
68  const float *x, int incx,
69  float beta, float *y, int incy);
70 void CORE_sgeqp3_init( int n, int *jpvt );
71 void CORE_sgeqp3_larfg( PLASMA_desc A, int ii, int jj, int i, int j,
72  float *tau, float *beta );
73 void CORE_sgeqp3_norms( PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2 );
74 void CORE_sgeqp3_pivot( PLASMA_desc A, float *F, int ldf,
75  int jj, int k, int *jpvt,
76  float *norms1, float *norms2, int *info );
77 int CORE_sgeqp3_tntpiv(int m, int n,
78  float *A, int lda,
79  int *IPIV, float *tau,
80  int *iwork);
81 void CORE_sgeqp3_update( const float *Ajj, int lda1,
82  float *Ajk, int lda2,
83  const float *Fk, int ldf,
84  int joff, int k, int koff, int nb,
85  float *norms1, float *norms2,
86  int *info );
87 int CORE_sgeqrt(int M, int N, int IB,
88  float *A, int LDA,
89  float *T, int LDT,
90  float *TAU, float *WORK);
91 int CORE_sgessm(int M, int N, int K, int IB,
92  const int *IPIV,
93  const float *L, int LDL,
94  float *A, int LDA);
95 int CORE_sgessq(int M, int N,
96  const float *A, int LDA,
97  float *scale, float *sumsq);
98 int CORE_sgetf2_nopiv(int m, int n,
99  float *A, int lda);
100 int CORE_sgetrf(int M, int N,
101  float *A, int LDA,
102  int *IPIV, int *INFO);
103 int CORE_sgetrf_incpiv(int M, int N, int IB,
104  float *A, int LDA,
105  int *IPIV, int *INFO);
106 int CORE_sgetrf_nopiv(int m, int n, int ib,
107  float *A, int lda);
108 int CORE_sgetrf_reclap(int M, int N,
109  float *A, int LDA,
110  int *IPIV, int *info);
111 void CORE_sgetrf_reclap_init(void);
112 int CORE_sgetrf_rectil(const PLASMA_desc A, int *IPIV, int *info);
113 void CORE_sgetrf_rectil_init(void);
114 void CORE_sgetrip(int m, int n, float *A,
115  float *work);
116 int CORE_shbelr(PLASMA_enum uplo, int N,
117  PLASMA_desc *A, float *V, float *TAU,
118  int st, int ed, int eltsize);
119 int CORE_shblrx(PLASMA_enum uplo, int N,
120  PLASMA_desc *A, float *V, float *TAU,
121  int st, int ed, int eltsize);
122 int CORE_shbrce(PLASMA_enum uplo, int N,
123  PLASMA_desc *A, float *V, float *TAU,
124  int st, int ed, int eltsize);
125 void CORE_ssbtype1cb(int N, int NB,
126  float *A, int LDA,
127  float *V, float *TAU,
128  int st, int ed, int sweep, int Vblksiz, int WANTZ,
129  float *WORK);
130 void CORE_ssbtype2cb(int N, int NB,
131  float *A, int LDA,
132  float *V, float *TAU,
133  int st, int ed, int sweep, int Vblksiz, int WANTZ,
134  float *WORK);
135 void CORE_ssbtype3cb(int N, int NB,
136  float *A, int LDA,
137  const float *V, const float *TAU,
138  int st, int ed, int sweep, int Vblksiz, int WANTZ,
139  float *WORK);
140 void CORE_sgbtype1cb(PLASMA_enum uplo, int N, int NB,
141  float *A, int LDA,
142  float *VQ, float *TAUQ,
143  float *VP, float *TAUP,
144  int st, int ed, int sweep, int Vblksiz, int WANTZ,
145  float *WORK);
146 void CORE_sgbtype2cb(PLASMA_enum uplo, int N, int NB,
147  float *A, int LDA,
148  float *VQ, float *TAUQ,
149  float *VP, float *TAUP,
150  int st, int ed, int sweep, int Vblksiz, int WANTZ,
151  float *WORK);
152 void CORE_sgbtype3cb(PLASMA_enum uplo, int N, int NB,
153  float *A, int LDA,
154  float *VQ, float *TAUQ,
155  float *VP, float *TAUP,
156  int st, int ed, int sweep, int Vblksiz, int WANTZ,
157  float *WORK);
158 void CORE_ssygst(int itype, PLASMA_enum uplo, int N,
159  float *A, int LDA,
160  float *B, int LDB, int *INFO);
/*
 * COMPLEX-only declarations.
 * CORE_ssymm, CORE_ssyrk and CORE_ssyr2k are declared again, unconditionally
 * and with identical signatures, later in this header; the copies here only
 * add redundant redeclarations when COMPLEX is defined.
 * CORE_shessq has no unconditional counterpart in the visible part of the
 * header, so it is available only when COMPLEX is defined.
 * NOTE(review): this section looks like an artifact of generating the header
 * from a complex-precision template - confirm before editing by hand.
 */
161 #ifdef COMPLEX
162 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
163  int M, int N,
164  float alpha, const float *A, int LDA,
165  const float *B, int LDB,
166  float beta, float *C, int LDC);
167 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
168  int N, int K,
169  float alpha, const float *A, int LDA,
170  float beta, float *C, int LDC);
171 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
172  int N, int K,
173  float alpha, const float *A, int LDA,
174  const float *B, int LDB,
175  float beta, float *C, int LDC);
/* Same parameter list as CORE_ssyssq declared later in this header. */
176 int CORE_shessq(PLASMA_enum uplo, int N,
177  const float *A, int LDA,
178  float *scale, float *sumsq);
179 #endif
180 int CORE_ssyrfb(PLASMA_enum uplo, int N, int K, int IB, int NB,
181  const float *A, int LDA,
182  const float *T, int LDT,
183  float *C, int LDC,
184  float *WORK, int LDWORK);
185 void CORE_slacpy(PLASMA_enum uplo, int M, int N,
186  const float *A, int LDA,
187  float *B, int LDB);
188 int CORE_slacpy_pivot( const PLASMA_desc descA,
189  PLASMA_enum direct,
190  int k1, int k2, const int *ipiv,
191  int *rankin, int *rankout,
192  float *A, int lda,
193  int init);
194 void CORE_slange(int norm, int M, int N,
195  const float *A, int LDA,
196  float *work, float *normA);
/*
 * CORE_slansy - single declaration, valid whether or not COMPLEX is defined.
 * The signature does not depend on the precision macros, so no
 * COMPLEX-guarded copy of this prototype is needed.
 *
 *   norm   selector for the norm to evaluate (accepted values are defined by
 *          the implementation, not visible in this header)
 *   uplo   PLASMA_enum selecting which triangle of A is referenced
 *          (presumably upper/lower - confirm against the implementation)
 *   N      matrix order
 *   A,LDA  read-only input matrix and its leading dimension
 *   work   caller-provided scratch buffer
 *   normA  output location; presumably receives the computed norm - confirm
 */
202 void CORE_slansy(int norm, PLASMA_enum uplo, int N,
203  const float *A, int LDA,
204  float *work, float *normA);
205 void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
206  int M, int N,
207  const float *A, int LDA,
208  float *work, float *normA);
209 int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
210  int M, int N, int K,
211  const float *V, int LDV,
212  const float *T, int LDT,
213  float *C, int LDC,
214  float *WORK, int LDWORK);
215 int CORE_slarfx2(PLASMA_enum side, int N,
216  float V,
217  float TAU,
218  float *C1, int LDC1,
219  float *C2, int LDC2);
220 int CORE_slarfx2c(PLASMA_enum uplo,
221  float V,
222  float TAU,
223  float *C1,
224  float *C2,
225  float *C3);
226 int CORE_slarfx2ce(PLASMA_enum uplo,
227  float *V,
228  float *TAU,
229  float *C1,
230  float *C2,
231  float *C3);
232 void CORE_slarfy(int N,
233  float *A, int LDA,
234  const float *V,
235  const float *TAU,
236  float *WORK);
237 void CORE_slaset(PLASMA_enum uplo, int n1, int n2,
238  float alpha, float beta,
239  float *tileA, int ldtilea);
240 void CORE_slaset2(PLASMA_enum uplo, int n1, int n2, float alpha,
241  float *tileA, int ldtilea);
242 void CORE_slaswp(int N, float *A, int LDA,
243  int I1, int I2, const int *IPIV, int INC);
244 int CORE_slaswp_ontile( PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc);
245 int CORE_slaswpc_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc);
246 int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans,
247  int M, int N,
248  const float *A, int LDA,
249  float *B, int LDB);
250 void CORE_slauum(PLASMA_enum uplo, int N, float *A, int LDA);
251 int CORE_spamm(int op, PLASMA_enum side, PLASMA_enum storev,
252  int M, int N, int K, int L,
253  const float *A1, int LDA1,
254  float *A2, int LDA2,
255  const float *V, int LDV,
256  float *W, int LDW);
257 int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
258  int M1, int N1, int M2, int N2, int K, int L,
259  float *A1, int LDA1,
260  float *A2, int LDA2,
261  const float *V, int LDV,
262  const float *T, int LDT,
263  float *WORK, int LDWORK);
264 int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev,
265  int M, int N, int L,
266  float ALPHA,
267  const float *A, int LDA,
268  const float *X, int INCX,
269  float BETA,
270  float *Y, int INCY,
271  float *WORK);
/*
 * CORE_splgsy - declared exactly once.
 * A second, byte-identical prototype adds nothing and only triggers
 * redundant-declaration warnings (e.g. GCC -Wredundant-decls).
 *
 *   bump        scalar parameter passed by value
 *   m, n        dimensions of the tile pointed to by A (assumed - confirm)
 *   A, lda      output tile and its leading dimension
 *   bigM        presumably the row count of the full matrix - TODO confirm
 *   m0, n0      presumably the tile's offset in the full matrix - TODO confirm
 *   seed        seed value for the generator
 */
272 void CORE_splgsy(float bump, int m, int n, float *A, int lda,
273  int bigM, int m0, int n0, unsigned long long int seed );
276 void CORE_splrnt(int m, int n, float *A, int lda,
277  int bigM, int m0, int n0, unsigned long long int seed );
278 int CORE_spltmg(PLASMA_enum mtxtype, int m, int n, float *A, int lda,
279  int gM, int gN, int m0, int n0, unsigned long long int seed );
280 int CORE_spltmg_chebvand( int M, int N, float *A, int LDA,
281  int gN, int m0, int n0,
282  float *W );
283 int CORE_spltmg_circul( int M, int N, float *A, int LDA,
284  int gM, int m0, int n0,
285  const float *V );
286 void CORE_spltmg_condexq( int M, int N, float *Q, int LDQ );
287 void CORE_spltmg_fiedler(int m, int n,
288  const float *X, int incX,
289  const float *Y, int incY,
290  float *A, int lda);
291 int CORE_spltmg_hankel( PLASMA_enum uplo, int M, int N, float *A, int LDA,
292  int m0, int n0, int nb,
293  const float *V1,
294  const float *V2 );
295 void CORE_spltmg_toeppd1( int gM, int m0, int M, float *W,
296  unsigned long long int seed );
297 void CORE_spltmg_toeppd2( int M, int N, int K, int m0, int n0,
298  const float *W,
299  float *A, int LDA );
300 void CORE_spotrf(PLASMA_enum uplo, int N, float *A, int LDA, int *INFO);
301 void CORE_ssetvar(const float *alpha, float *x);
302 void CORE_sshift(int s, int m, int n, int L,
303  float *A);
304 void CORE_sshiftw(int s, int cl, int m, int n, int L,
305  float *A, float *W);
306 int CORE_sssssm(int M1, int N1, int M2, int N2, int K, int IB,
307  float *A1, int LDA1,
308  float *A2, int LDA2,
309  const float *L1, int LDL1,
310  const float *L2, int LDL2,
311  const int *IPIV);
/*
 * CORE_sstedc - prototype whose parameter list depends on COMPLEX.
 * When COMPLEX is defined, the extra pair (RWORK, LRWORK) sits between
 * (WORK, LWORK) and (IWORK, LIWORK); otherwise the function takes ten
 * arguments. Every translation unit that calls or defines this function must
 * therefore see the same COMPLEX setting as this header.
 *
 *   compz        PLASMA_enum mode selector (semantics defined by the
 *                implementation)
 *   n            problem size
 *   D, E         float arrays, read/write (non-const)
 *   Z, LDZ       float matrix and its leading dimension
 *   WORK, LWORK  float workspace and its length
 *   IWORK, LIWORK integer workspace and its length
 */
312 int CORE_sstedc(PLASMA_enum compz, int n,
313  float *D, float *E,
314  float *Z, int LDZ,
315  float *WORK, int LWORK,
316 #ifdef COMPLEX
317  float *RWORK, int LRWORK,
318 #endif
319  int *IWORK, int LIWORK);
320 int CORE_ssteqr(PLASMA_enum compz, int n,
321  float *D, float *E,
322  float *Z, int LDZ,
323  float *WORK);
324 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
325  int M, int N,
326  float alpha, const float *A, int LDA,
327  const float *B, int LDB,
328  float beta, float *C, int LDC);
329 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
330  int N, int K,
331  float alpha, const float *A, int LDA,
332  float beta, float *C, int LDC);
333 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
334  int N, int K,
335  float alpha, const float *A, int LDA,
336  const float *B, int LDB,
337  float beta, float *C, int LDC);
338 int CORE_ssyssq(PLASMA_enum uplo, int N,
339  const float *A, int LDA,
340  float *scale, float *sumsq);
341 void CORE_sswpab(int i, int n1, int n2,
342  float *A, float *work);
343 int CORE_sswptr_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc,
344  const float *Akk, int ldak);
345 void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
346  int M, int N, const float *A, int lda, float *work);
347 void CORE_strdalg1(int n,
348  int nb,
349  float *A,
350  int lda,
351  float *V,
352  float *TAU,
353  int Vblksiz, int wantz,
354  int i, int sweepid, int m, int grsiz,
355  float *work);
356 void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo,
357  PLASMA_enum transA, PLASMA_enum diag,
358  int M, int N,
359  float alpha, const float *A, int LDA,
360  float *B, int LDB);
361 void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo,
362  PLASMA_enum transA, PLASMA_enum diag,
363  int M, int N,
364  float alpha, const float *A, int LDA,
365  float *B, int LDB);
366 int CORE_strssq(PLASMA_enum uplo, PLASMA_enum diag, int M, int N,
367  const float *A, int LDA,
368  float *scale, float *sumsq);
369 void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag, int N,
370  float *A, int LDA, int *info);
371 int CORE_stslqt(int M, int N, int IB,
372  float *A1, int LDA1,
373  float *A2, int LDA2,
374  float *T, int LDT,
375  float *TAU, float *WORK);
376 int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans,
377  int M1, int N1, int M2, int N2, int K, int IB,
378  float *A1, int LDA1,
379  float *A2, int LDA2,
380  const float *V, int LDV,
381  const float *T, int LDT,
382  float *WORK, int LDWORK);
383 int CORE_stsmlq_corner( int m1, int n1, int m2, int n2, int m3, int n3,
384  int k, int ib, int nb,
385  float *A1, int lda1,
386  float *A2, int lda2,
387  float *A3, int lda3,
388  const float *V, int ldv,
389  const float *T, int ldt,
390  float *WORK, int ldwork);
391 int CORE_stsmlq_sytra1( PLASMA_enum side, PLASMA_enum trans,
392  int m1, int n1, int m2, int n2,
393  int k, int ib,
394  float *A1, int lda1,
395  float *A2, int lda2,
396  const float *V, int ldv,
397  const float *T, int ldt,
398  float *WORK, int ldwork);
399 int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans,
400  int M1, int N1, int M2, int N2, int K, int IB,
401  float *A1, int LDA1,
402  float *A2, int LDA2,
403  const float *V, int LDV,
404  const float *T, int LDT,
405  float *WORK, int LDWORK);
406 int CORE_stsmqr_corner( int m1, int n1, int m2, int n2, int m3, int n3,
407  int k, int ib, int nb,
408  float *A1, int lda1,
409  float *A2, int lda2,
410  float *A3, int lda3,
411  const float *V, int ldv,
412  const float *T, int ldt,
413  float *WORK, int ldwork);
414 int CORE_stsmqr_sytra1( PLASMA_enum side, PLASMA_enum trans,
415  int m1, int n1, int m2, int n2,
416  int k, int ib,
417  float *A1, int lda1,
418  float *A2, int lda2,
419  const float *V, int ldv,
420  const float *T, int ldt,
421  float *WORK, int ldwork);
422 int CORE_stsqrt(int M, int N, int IB,
423  float *A1, int LDA1,
424  float *A2, int LDA2,
425  float *T, int LDT,
426  float *TAU, float *WORK);
427 int CORE_ststrf(int M, int N, int IB, int NB,
428  float *U, int LDU,
429  float *A, int LDA,
430  float *L, int LDL,
431  int *IPIV, float *WORK,
432  int LDWORK, int *INFO);
433 int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans,
434  int M1, int N1, int M2, int N2, int K, int IB,
435  float *A1, int LDA1,
436  float *A2, int LDA2,
437  const float *V, int LDV,
438  const float *T, int LDT,
439  float *WORK, int LDWORK);
440 int CORE_sttqrt(int M, int N, int IB,
441  float *A1, int LDA1,
442  float *A2, int LDA2,
443  float *T, int LDT,
444  float *TAU,
445  float *WORK);
446 int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans,
447  int M1, int N1, int M2, int N2, int K, int IB,
448  float *A1, int LDA1,
449  float *A2, int LDA2,
450  const float *V, int LDV,
451  const float *T, int LDT,
452  float *WORK, int LDWORK);
453 int CORE_sttlqt(int M, int N, int IB,
454  float *A1, int LDA1,
455  float *A2, int LDA2,
456  float *T, int LDT,
457  float *TAU,
458  float *WORK);
459 int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans,
460  int M, int N, int IB, int K,
461  const float *V, int LDV,
462  const float *T, int LDT,
463  float *C, int LDC,
464  float *WORK, int LDWORK);
465 int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans,
466  int M, int N, int K, int IB,
467  const float *V, int LDV,
468  const float *T, int LDT,
469  float *C, int LDC,
470  float *WORK, int LDWORK);
471 
472 #ifndef COMPLEX
473 void CORE_slaed2_computeK(int *K, int n, int n1,
474  float *beta, float *D, float *Q, int LDQ,
475  float *Z, float *DLAMBDA, float *W,
476  int *INDX, int *INDXC, int *INDXP, int *INDXQ,
477  int *COLTYP);
478 void CORE_slaed2_compressq(int n, int n1, const int *INDX, const int *ctot,
479  const float *Q, int LDQ, float *Q2,
480  int start, int end);
481 void CORE_slaed2_copydef(int n, int n1, int K, const int *ctot,
482  float *Q, int LDQ, const float *Q2,
483  int start, int end);
484 int CORE_slaed4(int n, int K,
485  float *D, float beta,
486  float *Q, int LDQ,
487  const float *D0, const float *Z,
488  const int *INDX,
489  int start, int end );
490 void CORE_slaed3_computeW(int n, int K,
491  const float *Q, int LDQ,
492  const float *DLAMBDA, float *W,
493  const int *INDX,
494  int start, int end);
495 void CORE_slaed3_reduceW(int n, int n1, int K, int l,
496  const float *Q, int LDQ,
497  const float *Wred, float *W);
498 void CORE_slaed3_computevectors(int K, int il_nondef, int iu_nondef,
499  float *Q, int LDQ, float *W, float *S,
500  const int *INDXC,
501  int start, int end);
502 void CORE_slaed3_merge( int n, int K, float *D, int *INDXQ );
503 void CORE_slaed3_updatevectors(int op, int wsmode, int n, int n1, int K,
504  int il_nondef, int iu_nondef,
505  float *Q, int ldq, float *Q2,
506  const int *ctot, float *WORK, int start, int end);
507 #endif
508 void CORE_sswap(int m, int n, float *Q, int ldq,
509  const float *work, const int *perm,
510  int start, int end);
511 int CORE_slascl(PLASMA_enum type, int kl, int ku, float cfrom, float cto,
512  int m, int n, float *A, int lda);
513 #ifdef COMPLEX
514 int CORE_slag2c(int m, int n, const float *Q, int LDQ,
515  float *Z, int LDZ);
516 #endif
517 
518 #ifndef COMPLEX
519 void CORE_slaed3_freebigwork(int oper, float **WORK);
520 void CORE_slaed0_betaapprox(int subpbs, const int *subpbs_info,
521  float *D, const float *E);
522 int CORE_slapst(PLASMA_enum type, int n,
523  const float *D, int *INDX);
524 #endif
525 
526 #if defined(QUARK_H)
527 
530 void QUARK_CORE_sasum(Quark *quark, Quark_Task_Flags *task_flags,
531  PLASMA_enum storev, PLASMA_enum uplo, int m, int n,
532  const float *A, int lda, int szeA,
533  float *work, int szeW);
534 void QUARK_CORE_sasum_f1(Quark *quark, Quark_Task_Flags *task_flags,
535  PLASMA_enum storev, PLASMA_enum uplo, int m, int n,
536  const float *A, int lda, int szeA,
537  float *work, int szeW,
538  float *fake, int szeF);
539 void QUARK_CORE_sgeadd(Quark *quark, Quark_Task_Flags *task_flags,
540  int m, int n, int nb, float alpha,
541  const float *A, int lda,
542  float *B, int ldb);
543 void QUARK_CORE_sbrdalg1(Quark *quark, Quark_Task_Flags *task_flags,
544  PLASMA_enum uplo,
545  int n, int nb,
546  float *A,
547  int lda,
548  float *VQ,
549  float *TAUQ,
550  float *VP,
551  float *TAUP,
552  int Vblksiz, int wantz,
553  int i, int sweepid, int m, int grsiz,
554  int *PCOL, int *ACOL, int *MCOL);
555 void QUARK_CORE_sgelqt(Quark *quark, Quark_Task_Flags *task_flags,
556  int m, int n, int ib, int nb,
557  float *A, int lda,
558  float *T, int ldt);
559 void QUARK_CORE_sgemm(Quark *quark, Quark_Task_Flags *task_flags,
560  PLASMA_enum transA, PLASMA_enum transB,
561  int m, int n, int k, int nb,
562  float alpha, const float *A, int lda,
563  const float *B, int ldb,
564  float beta, float *C, int ldc);
565 void QUARK_CORE_sgemm2( Quark *quark, Quark_Task_Flags *task_flags,
566  PLASMA_enum transA, PLASMA_enum transB,
567  int m, int n, int k, int nb,
568  float alpha, const float *A, int lda,
569  const float *B, int ldb,
570  float beta, float *C, int ldc);
571 void QUARK_CORE_sgemm_f2(Quark *quark, Quark_Task_Flags *task_flags,
572  PLASMA_enum transA, PLASMA_enum transB,
573  int m, int n, int k, int nb,
574  float alpha, const float *A, int lda,
575  const float *B, int ldb,
576  float beta, float *C, int ldc,
577  float *fake1, int szefake1, int flag1,
578  float *fake2, int szefake2, int flag2);
/*
 * QUARK_CORE_sgemm_p2 - same parameter list as QUARK_CORE_sgemm except that
 * B is passed as a pointer to a pointer (const float **) rather than as a
 * direct const float * operand.
 * NOTE(review): presumably the B pointer is resolved when the task runs
 * rather than when it is inserted - confirm against the implementation.
 */
579 void QUARK_CORE_sgemm_p2(Quark *quark, Quark_Task_Flags *task_flags,
580  PLASMA_enum transA, PLASMA_enum transB,
581  int m, int n, int k, int nb,
582  float alpha, const float *A, int lda,
583  const float **B, int ldb,
584  float beta, float *C, int ldc);
585 void QUARK_CORE_sgemm_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
586  PLASMA_enum transA, PLASMA_enum transB,
587  int m, int n, int k, int nb,
588  float alpha, const float *A, int lda,
589  const float **B, int ldb,
590  float beta, float *C, int ldc,
591  float *fake1, int szefake1, int flag1);
/*
 * QUARK_CORE_sgemm_p3 - same parameter list as QUARK_CORE_sgemm except that
 * the output operand C is passed as a pointer to a pointer (float **) rather
 * than as a direct float * operand.
 * NOTE(review): presumably the C pointer is resolved when the task runs
 * rather than when it is inserted - confirm against the implementation.
 */
592 void QUARK_CORE_sgemm_p3(Quark *quark, Quark_Task_Flags *task_flags,
593  PLASMA_enum transA, PLASMA_enum transB,
594  int m, int n, int k, int nb,
595  float alpha, const float *A, int lda,
596  const float *B, int ldb,
597  float beta, float **C, int ldc);
598 void QUARK_CORE_sgemm_tile(Quark *quark, Quark_Task_Flags *task_flags,
599  PLASMA_enum transA, PLASMA_enum transB,
600  int m, int n, int k, int nb,
601  const float *alpha, const float *A, int lda,
602  const float *B, int ldb,
603  const float *beta, float *C, int ldc,
604  const float *Alock,
605  const float *Block,
606  const float *Clock);
607 void QUARK_CORE_sgemv(Quark *quark, Quark_Task_Flags *task_flags,
608  PLASMA_enum trans, int m, int n,
609  float alpha, const float *A, int lda,
610  const float *x, int incx,
611  float beta, float *y, int incy);
612 void QUARK_CORE_sgemv_tile(Quark *quark, Quark_Task_Flags *task_flags,
613  PLASMA_enum trans,
614  int m, int n,
615  const float *alpha, const float *A, int lda,
616  const float *x, int incx,
617  const float *beta, float *y, int incy,
618  const float *Alock,
619  const float *xlock,
620  const float *ylock);
621 void QUARK_CORE_sgeqp3_init( Quark *quark, Quark_Task_Flags *task_flags,
622  int n, int *jpvt );
623 void QUARK_CORE_sgeqp3_larfg(Quark *quark, Quark_Task_Flags *task_flags,
624  PLASMA_desc A, int ii, int jj, int i, int j,
625  float *tau, float *beta );
626 void QUARK_CORE_sgeqp3_norms( Quark *quark, Quark_Task_Flags *task_flags,
627  PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2 );
628 void QUARK_CORE_sgeqp3_pivot( Quark *quark, Quark_Task_Flags *task_flags,
629  PLASMA_desc A,
630  float *F, int ldf,
631  int jj, int k, int *jpvt,
632  float *norms1, float *norms2, int *info );
633 void QUARK_CORE_sgeqp3_tntpiv(Quark *quark, Quark_Task_Flags *task_flags,
634  int m, int n, int nb,
635  float *A, int lda,
636  int *IPIV,
637  PLASMA_sequence *sequence, PLASMA_request *request,
638  PLASMA_bool check_info, int iinfo);
639 void QUARK_CORE_sgeqp3_update( Quark *quark, Quark_Task_Flags *task_flags,
640  float *Ajj, int lda1,
641  float *Ajk, int lda2,
642  float *Fk, int ldf,
643  int joff, int k, int koff, int nb,
644  float *norms1, float *norms2, int *info );
645 void QUARK_CORE_sgeqrt(Quark *quark, Quark_Task_Flags *task_flags,
646  int m, int n, int ib, int nb,
647  float *A, int lda,
648  float *T, int ldt);
649 void QUARK_CORE_sgessm(Quark *quark, Quark_Task_Flags *task_flags,
650  int m, int n, int k, int ib, int nb,
651  const int *IPIV,
652  const float *L, int ldl,
653  float *A, int lda);
654 void QUARK_CORE_sgessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
655  int m, int n, const float *A, int lda,
656  float *scale, float *sumsq,
657  float *fake, int szeF, int paramF );
658 void QUARK_CORE_sgetrf(Quark *quark, Quark_Task_Flags *task_flags,
659  int m, int n, int nb,
660  float *A, int lda,
661  int *IPIV,
662  PLASMA_sequence *sequence, PLASMA_request *request,
663  PLASMA_bool check_info, int iinfo);
664 void QUARK_CORE_sgetrf_incpiv(Quark *quark, Quark_Task_Flags *task_flags,
665  int m, int n, int ib, int nb,
666  float *A, int lda,
667  int *IPIV,
668  PLASMA_sequence *sequence, PLASMA_request *request,
669  PLASMA_bool check_info, int iinfo);
670 void QUARK_CORE_sgetrf_nopiv(Quark *quark, Quark_Task_Flags *task_flags,
671  int m, int n, int ib, int nb,
672  float *A, int lda,
673  PLASMA_sequence *sequence, PLASMA_request *request,
674  int iinfo);
675 void QUARK_CORE_sgetrf_reclap(Quark *quark, Quark_Task_Flags *task_flags,
676  int m, int n, int nb,
677  float *A, int lda,
678  int *IPIV,
679  PLASMA_sequence *sequence, PLASMA_request *request,
680  PLASMA_bool check_info, int iinfo,
681  int nbthread);
682 void QUARK_CORE_sgetrf_rectil(Quark *quark, Quark_Task_Flags *task_flags,
683  PLASMA_desc A, float *Amn, int size,
684  int *IPIV,
685  PLASMA_sequence *sequence, PLASMA_request *request,
686  PLASMA_bool check_info, int iinfo,
687  int nbthread);
688 void QUARK_CORE_sgetrip(Quark *quark, Quark_Task_Flags *task_flags,
689  int m, int n, float *A, int szeA);
690 void QUARK_CORE_sgetrip_f1(Quark *quark, Quark_Task_Flags *task_flags,
691  int m, int n, float *A, int szeA,
692  float *fake, int szeF, int paramF);
693 void QUARK_CORE_sgetrip_f2(Quark *quark, Quark_Task_Flags *task_flags,
694  int m, int n, float *A, int szeA,
695  float *fake1, int szeF1, int paramF1,
696  float *fake2, int szeF2, int paramF2);
/*
 * QUARK_CORE_ssymm - task-insertion wrapper prototype.
 * An identical prototype for this function appears a second time later in
 * this header; the redeclaration is compatible, but the two copies must be
 * kept in sync if the signature ever changes.
 * Compared with CORE_ssymm, this takes the Quark handle, the task flags and
 * an additional `nb` argument.
 */
697 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
698  PLASMA_enum side, PLASMA_enum uplo,
699  int m, int n, int nb,
700  float alpha, const float *A, int lda,
701  const float *B, int ldb,
702  float beta, float *C, int ldc);
703 void QUARK_CORE_ssygst(Quark *quark, Quark_Task_Flags *task_flags,
704  int itype, PLASMA_enum uplo, int N,
705  float *A, int LDA,
706  float *B, int LDB,
707  PLASMA_sequence *sequence, PLASMA_request *request,
708  int iinfo);
709 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
710  PLASMA_enum uplo, PLASMA_enum trans,
711  int n, int k, int nb,
712  float alpha, const float *A, int lda,
713  float beta, float *C, int ldc);
714 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
715  PLASMA_enum uplo, PLASMA_enum trans,
716  int n, int k, int nb,
717  float alpha, const float *A, int lda,
718  const float *B, int LDB,
719  float beta, float *C, int ldc);
720 void QUARK_CORE_ssyrfb(Quark *quark, Quark_Task_Flags *task_flags,
721  PLASMA_enum uplo,
722  int n, int k, int ib, int nb,
723  const float *A, int lda,
724  const float *T, int ldt,
725  float *C, int ldc);
726 void QUARK_CORE_shessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
727  PLASMA_enum uplo, int n, const float *A, int lda,
728  float *scale, float *sumsq,
729  float *fake, int szeF, int paramF );
730 void QUARK_CORE_slacpy(Quark *quark, Quark_Task_Flags *task_flags,
731  PLASMA_enum uplo, int m, int n, int mb,
732  const float *A, int lda,
733  float *B, int ldb);
734 void QUARK_CORE_slacpy_f1(Quark *quark, Quark_Task_Flags *task_flags,
735  PLASMA_enum uplo, int m, int n, int nb,
736  const float *A, int lda,
737  float *B, int ldb,
738  float *fake1, int szefake1, int flag1);
739 void QUARK_CORE_slacpy_pivot(Quark *quark, Quark_Task_Flags *task_flags,
740  const PLASMA_desc descA,
741  PLASMA_enum direct,
742  int k1, int k2, const int *ipiv,
743  int *rankin, int *rankout,
744  float *A, int lda,
745  int pos, int init);
746 void QUARK_CORE_slange(Quark *quark, Quark_Task_Flags *task_flags,
747  int norm, int M, int N,
748  const float *A, int LDA, int szeA,
749  int szeW, float *result);
750 void QUARK_CORE_slange_f1(Quark *quark, Quark_Task_Flags *task_flags,
751  int norm, int M, int N,
752  const float *A, int LDA, int szeA,
753  int szeW, float *result,
754  float *fake, int szeF);
/*
 * QUARK_CORE_slansy / QUARK_CORE_slansy_f1 - each declared once,
 * unconditionally. The signatures do not depend on COMPLEX, so no
 * COMPLEX-guarded copies of these prototypes are needed.
 *
 *   quark, task_flags  Quark handle and task flags
 *   norm, uplo, N      same roles as in CORE_slansy
 *   A, LDA, szeA       read-only input tile, its leading dimension and a size
 *                      argument (presumably the element count used for
 *                      dependency tracking - TODO confirm)
 *   szeW               size of the workspace (presumably allocated by the
 *                      wrapper - TODO confirm)
 *   result             output location
 */
766 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
767  int norm, PLASMA_enum uplo, int N,
768  const float *A, int LDA, int szeA,
769  int szeW, float *result);
/* Variant taking one extra (fake, szeF) argument pair after `result`. */
770 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
771  int norm, PLASMA_enum uplo, int N,
772  const float *A, int LDA, int szeA,
773  int szeW, float *result,
774  float *fake, int szeF);
775 void QUARK_CORE_slantr(Quark *quark, Quark_Task_Flags *task_flags,
776  PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N,
777  const float *A, int LDA, int szeA,
778  int szeW, float *result);
779 void QUARK_CORE_slantr_f1(Quark *quark, Quark_Task_Flags *task_flags,
780  PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N,
781  const float *A, int LDA, int szeA,
782  int szeW, float *result,
783  float *fake, int szeF);
784 void QUARK_CORE_slaset(Quark *quark, Quark_Task_Flags *task_flags,
785  PLASMA_enum uplo, int n1, int n2, float alpha,
786  float beta, float *tileA, int ldtilea);
787 void QUARK_CORE_slaset2(Quark *quark, Quark_Task_Flags *task_flags,
788  PLASMA_enum uplo, int n1, int n2, float alpha,
789  float *tileA, int ldtilea);
790 void QUARK_CORE_slaswp(Quark *quark, Quark_Task_Flags *task_flags,
791  int n, float *A, int lda,
792  int i1, int i2, const int *ipiv, int inc);
793 void QUARK_CORE_slaswp_f2(Quark *quark, Quark_Task_Flags *task_flags,
794  int n, float *A, int lda,
795  int i1, int i2, const int *ipiv, int inc,
796  float *fake1, int szefake1, int flag1,
797  float *fake2, int szefake2, int flag2);
798 void QUARK_CORE_slaswp_ontile(Quark *quark, Quark_Task_Flags *task_flags,
799  PLASMA_desc descA, float *A,
800  int i1, int i2, const int *ipiv, int inc, float *fakepanel);
801 void QUARK_CORE_slaswp_ontile_f2(Quark *quark, Quark_Task_Flags *task_flags,
802  PLASMA_desc descA, float *A,
803  int i1, int i2, const int *ipiv, int inc,
804  float *fake1, int szefake1, int flag1,
805  float *fake2, int szefake2, int flag2);
806 void QUARK_CORE_slaswpc_ontile(Quark *quark, Quark_Task_Flags *task_flags,
807  PLASMA_desc descA, float *A,
808  int i1, int i2, const int *ipiv, int inc, float *fakepanel);
809 void QUARK_CORE_slatro(Quark *quark, Quark_Task_Flags *task_flags,
810  PLASMA_enum uplo, PLASMA_enum trans, int m, int n, int mb,
811  const float *A, int lda,
812  float *B, int ldb);
813 void QUARK_CORE_slatro_f1(Quark *quark, Quark_Task_Flags *task_flags,
814  PLASMA_enum uplo, PLASMA_enum trans, int m, int n, int mb,
815  const float *A, int lda,
816  float *B, int ldb,
817  float *fake1, int szefake1, int flag1);
818 void QUARK_CORE_slauum(Quark *quark, Quark_Task_Flags *task_flags,
819  PLASMA_enum uplo, int n, int nb,
820  float *A, int lda);
/*
 * QUARK_CORE_splgsy - declared exactly once.
 * A second, byte-identical prototype adds nothing and only triggers
 * redundant-declaration warnings (e.g. GCC -Wredundant-decls).
 * The arguments after (quark, task_flags) match CORE_splgsy one for one.
 */
821 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
822  float bump, int m, int n, float *A, int lda,
823  int bigM, int m0, int n0, unsigned long long int seed );
827 void QUARK_CORE_splrnt(Quark *quark, Quark_Task_Flags *task_flags,
828  int m, int n, float *A, int lda,
829  int bigM, int m0, int n0, unsigned long long int seed );
830 void QUARK_CORE_spltmg(Quark *quark, Quark_Task_Flags *task_flags,
831  PLASMA_enum mtxtype, int m, int n, float *A, int lda,
832  int gM, int gN, int m0, int n0, unsigned long long int seed );
833 void QUARK_CORE_spltmg_chebvand( Quark *quark, Quark_Task_Flags *task_flags,
834  int M, int N, float *A, int LDA,
835  int gN, int m0, int n0,
836  float *W );
837 void QUARK_CORE_spltmg_circul( Quark *quark, Quark_Task_Flags *task_flags,
838  int M, int N, float *A, int LDA,
839  int gM, int m0, int n0,
840  const float *W );
841 void QUARK_CORE_spltmg_fiedler(Quark *quark, Quark_Task_Flags *task_flags,
842  int m, int n,
843  const float *X, int incX,
844  const float *Y, int incY,
845  float *A, int lda);
846 void QUARK_CORE_spltmg_hankel( Quark *quark, Quark_Task_Flags *task_flags,
847  PLASMA_enum uplo, int M, int N, float *A, int LDA,
848  int m0, int n0, int nb,
849  const float *V1,
850  const float *V2);
851 void QUARK_CORE_spltmg_toeppd1(Quark *quark, Quark_Task_Flags *task_flags,
852  int gM, int m0, int M,
853  float *W,
854  unsigned long long int seed);
855 void QUARK_CORE_spltmg_toeppd2(Quark *quark, Quark_Task_Flags *task_flags,
856  int M, int N, int K, int m0, int n0,
857  const float *W,
858  float *A, int LDA );
859 void QUARK_CORE_spotrf(Quark *quark, Quark_Task_Flags *task_flags,
860  PLASMA_enum uplo, int n, int nb,
861  float *A, int lda,
862  PLASMA_sequence *sequence, PLASMA_request *request,
863  int iinfo);
864 void QUARK_CORE_ssetvar(Quark *quark, Quark_Task_Flags *task_flags,
865  const float *alpha, float *x,
866  float *Alock);
867 void QUARK_CORE_sshift( Quark *quark, Quark_Task_Flags *task_flags,
868  int s, int m, int n, int L,
869  float *A);
870 void QUARK_CORE_sshiftw(Quark *quark, Quark_Task_Flags *task_flags,
871  int s, int cl, int m, int n, int L,
872  float *A, float *W);
873 void QUARK_CORE_sssssm(Quark *quark, Quark_Task_Flags *task_flags,
874  int m1, int n1, int m2, int n2, int k, int ib, int nb,
875  float *A1, int lda1,
876  float *A2, int lda2,
877  const float *L1, int ldl1,
878  const float *L2, int ldl2,
879  const int *IPIV);
880 void QUARK_CORE_sstedc(Quark *quark, Quark_Task_Flags *task_flags,
881  PLASMA_enum compz, int n,
882  float *D, float *E,
883  float *Z, int ldz);
/*
 * QUARK_CORE_sstedc_f2 -- prototype only; the definition is not in this header.
 * The leading parameters (compz, n, D, E, Z, ldz) match QUARK_CORE_sstedc,
 * declared immediately above.  Two untyped (void *) pointer/size/flag triples
 * follow them.
 * NOTE(review): the "fake" triples presumably express extra task
 * dependencies -- confirm against the definition.
 */
884 void QUARK_CORE_sstedc_f2(Quark *quark, Quark_Task_Flags *task_flags,
885  PLASMA_enum compz, int n,
886  float *D, float *E,
887  float *Z, int ldz,
888  void *fake1, int szefake1, int flag1,
889  void *fake2, int szefake2, int flag2);
890 void QUARK_CORE_ssteqr(Quark *quark, Quark_Task_Flags *task_flags,
891  PLASMA_enum compz, int n,
892  float *D, float *E,
893  float *Z, int ldz);
894 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
895  PLASMA_enum side, PLASMA_enum uplo,
896  int m, int n, int nb,
897  float alpha, const float *A, int lda,
898  const float *B, int ldb,
899  float beta, float *C, int ldc);
900 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
901  PLASMA_enum uplo, PLASMA_enum trans,
902  int n, int k, int nb,
903  float alpha, const float *A, int lda,
904  float beta, float *C, int ldc);
905 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
906  PLASMA_enum uplo, PLASMA_enum trans,
907  int n, int k, int nb,
908  float alpha, const float *A, int lda,
909  const float *B, int LDB,
910  float beta, float *C, int ldc);
911 void QUARK_CORE_ssyssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
912  PLASMA_enum uplo, int n, const float *A, int lda,
913  float *scale, float *sumsq,
914  float *fake, int szeF, int paramF );
915 void QUARK_CORE_sswpab(Quark *quark, Quark_Task_Flags *task_flags,
916  int i, int n1, int n2,
917  float *A, int szeA);
918 void QUARK_CORE_sswptr_ontile(Quark *quark, Quark_Task_Flags *task_flags,
919  PLASMA_desc descA, float *Aij,
920  int i1, int i2, const int *ipiv, int inc,
921  const float *Akk, int ldak);
922 void QUARK_CORE_strasm(Quark *quark, Quark_Task_Flags *task_flags,
923  PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int m, int n,
924  const float *A, int lda, int szeA,
925  float *work, int szeW);
926 void QUARK_CORE_strasm_f1(Quark *quark, Quark_Task_Flags *task_flags,
927  PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int m, int n,
928  const float *A, int lda, int szeA,
929  float *work, int szeW,
930  float *fake, int szeF);
931 void QUARK_CORE_strdalg1(Quark *quark, Quark_Task_Flags *task_flags,
932  int n,
933  int nb,
934  float *A,
935  int lda,
936  float *V,
937  float *TAU,
938  int Vblksiz, int wantz,
939  int i, int sweepid, int m, int grsiz,
940  int *PCOL, int *ACOL, int *MCOL);
941 void QUARK_CORE_strmm(Quark *quark, Quark_Task_Flags *task_flags,
942  PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
943  int m, int n, int nb,
944  float alpha, const float *A, int lda,
945  float *B, int ldb);
/*
 * QUARK_CORE_strmm_p2 -- prototype only; the definition is not in this header.
 * The parameter list is the same as QUARK_CORE_strmm (declared immediately
 * above) except that B is passed as `float **` instead of `float *`.
 * NOTE(review): presumably the tile pointer is resolved when the task runs --
 * confirm against the definition.
 */
946 void QUARK_CORE_strmm_p2(Quark *quark, Quark_Task_Flags *task_flags,
947  PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
948  int m, int n, int nb,
949  float alpha, const float *A, int lda,
950  float **B, int ldb);
951 void QUARK_CORE_strsm(Quark *quark, Quark_Task_Flags *task_flags,
952  PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
953  int m, int n, int nb,
954  float alpha, const float *A, int lda,
955  float *B, int ldb);
956 void QUARK_CORE_strssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
957  PLASMA_enum uplo, PLASMA_enum diag,
958  int m, int n, const float *A, int lda,
959  float *scale, float *sumsq,
960  float *fake, int szeF, int paramF );
961 void QUARK_CORE_strtri(Quark *quark, Quark_Task_Flags *task_flags,
962  PLASMA_enum uplo, PLASMA_enum diag, int n, int nb,
963  float *A, int lda,
964  PLASMA_sequence *sequence, PLASMA_request *request,
965  int iinfo);
966 void QUARK_CORE_stslqt(Quark *quark, Quark_Task_Flags *task_flags,
967  int m, int n, int ib, int nb,
968  float *A1, int lda1,
969  float *A2, int lda2,
970  float *T, int ldt);
971 void QUARK_CORE_stsmlq(Quark *quark, Quark_Task_Flags *task_flags,
972  PLASMA_enum side, PLASMA_enum trans,
973  int m1, int n1, int m2, int n2, int k, int ib, int nb,
974  float *A1, int lda1,
975  float *A2, int lda2,
976  const float *V, int ldv,
977  const float *T, int ldt);
978 void QUARK_CORE_stsmlq_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
979  PLASMA_enum side, PLASMA_enum trans,
980  int m1, int n1, int m2, int n2, int k, int ib, int nb,
981  float *A1, int lda1,
982  float *A2, int lda2,
983  const float *V, int ldv,
984  const float *T, int ldt);
985 void QUARK_CORE_stsmlq_corner(Quark *quark, Quark_Task_Flags *task_flags,
986  int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb,
987  float *A1, int lda1,
988  float *A2, int lda2,
989  float *A3, int lda3,
990  const float *V, int ldv,
991  const float *T, int ldt);
992 void QUARK_CORE_stsmqr(Quark *quark, Quark_Task_Flags *task_flags,
993  PLASMA_enum side, PLASMA_enum trans,
994  int m1, int n1, int m2, int n2, int k, int ib, int nb,
995  float *A1, int lda1,
996  float *A2, int lda2,
997  const float *V, int ldv,
998  const float *T, int ldt);
999 void QUARK_CORE_stsmqr_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
1000  PLASMA_enum side, PLASMA_enum trans,
1001  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1002  float *A1, int lda1,
1003  float *A2, int lda2,
1004  const float *V, int ldv,
1005  const float *T, int ldt);
1006 void QUARK_CORE_stsmqr_corner(Quark *quark, Quark_Task_Flags *task_flags,
1007  int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb,
1008  float *A1, int lda1,
1009  float *A2, int lda2,
1010  float *A3, int lda3,
1011  const float *V, int ldv,
1012  const float *T, int ldt);
1013 void QUARK_CORE_stsqrt(Quark *quark, Quark_Task_Flags *task_flags,
1014  int m, int n, int ib, int nb,
1015  float *A1, int lda1,
1016  float *A2, int lda2,
1017  float *T, int ldt);
1018 void QUARK_CORE_ststrf(Quark *quark, Quark_Task_Flags *task_flags,
1019  int m, int n, int ib, int nb,
1020  float *U, int ldu,
1021  float *A, int lda,
1022  float *L, int ldl,
1023  int *IPIV,
1024  PLASMA_sequence *sequence, PLASMA_request *request,
1025  PLASMA_bool check_info, int iinfo);
1026 void QUARK_CORE_sttmqr(Quark *quark, Quark_Task_Flags *task_flags,
1027  PLASMA_enum side, PLASMA_enum trans,
1028  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1029  float *A1, int lda1,
1030  float *A2, int lda2,
1031  const float *V, int ldv,
1032  const float *T, int ldt);
1033 void QUARK_CORE_sttqrt(Quark *quark, Quark_Task_Flags *task_flags,
1034  int m, int n, int ib, int nb,
1035  float *A1, int lda1,
1036  float *A2, int lda2,
1037  float *T, int ldt);
1038 void QUARK_CORE_sttmlq(Quark *quark, Quark_Task_Flags *task_flags,
1039  PLASMA_enum side, PLASMA_enum trans,
1040  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1041  float *A1, int lda1,
1042  float *A2, int lda2,
1043  const float *V, int ldv,
1044  const float *T, int ldt);
1045 void QUARK_CORE_sttlqt(Quark *quark, Quark_Task_Flags *task_flags,
1046  int m, int n, int ib, int nb,
1047  float *A1, int lda1,
1048  float *A2, int lda2,
1049  float *T, int ldt);
1050 void QUARK_CORE_spamm(Quark *quark, Quark_Task_Flags *task_flags,
1051  int op, PLASMA_enum side, PLASMA_enum storev,
1052  int m, int n, int k, int l,
1053  const float *A1, int lda1,
1054  float *A2, int lda2,
1055  const float *V, int ldv,
1056  float *W, int ldw);
1057 void QUARK_CORE_splssq( Quark *quark, Quark_Task_Flags *task_flags,
1058  int m, const float *A, float *result );
1059 void QUARK_CORE_sormlq(Quark *quark, Quark_Task_Flags *task_flags,
1060  PLASMA_enum side, PLASMA_enum trans,
1061  int m, int n, int ib, int nb, int k,
1062  const float *A, int lda,
1063  const float *T, int ldt,
1064  float *C, int ldc);
1065 void QUARK_CORE_sormqr(Quark *quark, Quark_Task_Flags *task_flags,
1066  PLASMA_enum side, PLASMA_enum trans,
1067  int m, int n, int k, int ib, int nb,
1068  const float *A, int lda,
1069  const float *T, int ldt,
1070  float *C, int ldc);
1071 
1072 
1073 void QUARK_CORE_slascl(Quark *quark, Quark_Task_Flags *task_flags,
1074  PLASMA_enum type, int kl, int ku, float cfrom, float cto,
1075  int m, int n, float *A, int lda);
/*
 * QUARK_CORE_slascl_p2f1 -- prototype only; the definition is not in this header.
 * Unlike QUARK_CORE_slascl (declared immediately above), cfrom and cto are
 * passed as `float *` rather than by value, and an extra untyped
 * fake/szefake/flag triple is appended.
 * NOTE(review): the triple presumably expresses an extra task dependency --
 * confirm against the definition.
 */
1076 void QUARK_CORE_slascl_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1077  PLASMA_enum type, int kl, int ku, float *cfrom, float *cto,
1078  int m, int n, float *A, int lda,
1079  void *fake, int szefake, int flag);
1080 void QUARK_CORE_slaed0_lascl( Quark *quark, Quark_Task_Flags *task_flags,
1081  int n, float *scale, float *D, float *E);
1082 void QUARK_CORE_slaed0_betaapprox(Quark *quark, Quark_Task_Flags *task_flags,
1083  int subpbs, const int *subpbs_info,
1084  float *D, const float *E);
1085 
1086 #ifndef COMPLEX
1087 void QUARK_CORE_slaed2_computeK(Quark *quark, Quark_Task_Flags *task_flags,
1088  int *K1, int n, int n1,
1089  float *beta, float *D, float *Q, int LDQ,
1090  float *Z, float *DLAMBDA, float *W,
1091  int *INDX, int *INDXC, int *INDXP, int *INDXQ,
1092  int *COLTYP,
1093  float **Qmerge, int wsmode,
1094  int *K2);
1095 
1096 void QUARK_CORE_slaed1_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1097  int n, int n1, const int *K,
1098  const int *INDX, const int *ctot,
1099  float *D, const float *beta,
1100  float *Q, int LDQ, float *Q2,
1101  const float *DLAMBDA, const float *W, float *Wred,
1102  int start, int end);
1103 void QUARK_CORE_slaed2_compressq(Quark *quark, Quark_Task_Flags *task_flags,
1104  int n, int n1, int start, int end,
1105  const int *INDX, const int *ctot,
1106  const float *Q, int LDQ,
1107  float *Q2, int *K);
1108 void QUARK_CORE_slaed4_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1109  int n, const int *K,
1110  float *D, const float *beta,
1111  float **Q, const int *LDQ,
1112  const float *DLAMBDA, const float *W, const int *INDX,
1113  int start, int end,
1114  PLASMA_sequence *sequence, PLASMA_request *request,
1115  void *fakeQ, int flagfQ);
1116 void QUARK_CORE_slaed3_compW_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1117  int n, const int *K,
1118  float **Q, const int *LDQ,
1119  const float *DLAMBDA, float *W,
1120  const int *INDX,
1121  int start, int end,
1122  void *fakeQ, int flagfQ,
1123  void *fakeW, int flagfW);
1124 
1125 void QUARK_CORE_slaed3_reduceW(Quark *quark, Quark_Task_Flags *task_flags,
1126  int n, int n1, const int *K, int l,
1127  const float *Q, int LDQ,
1128  const float *Wred, float *W);
/*
 * QUARK_CORE_slaed3_reduceW_p2 -- prototype only; the definition is not in
 * this header.  Declared inside the enclosing `#ifndef COMPLEX` region.
 * It differs from QUARK_CORE_slaed3_reduceW (declared immediately above) in
 * that Q is `float **` and LDQ is `const int *`, so both are passed by address
 * instead of by value.
 */
1129 void QUARK_CORE_slaed3_reduceW_p2(Quark *quark, Quark_Task_Flags *task_flags,
1130  int n, int n1, const int *K, int l,
1131  float **Q, const int *LDQ,
1132  const float *Wred, float *W);
1133 
1134 void QUARK_CORE_slaed2_copydef(Quark *quark, Quark_Task_Flags *task_flags,
1135  int n, int n1, const int *K, const int *ctot,
1136  float *Q, int LDQ, const float *Q2,
1137  int start, int end);
1138 void QUARK_CORE_slaed3_computevectors(Quark *quark, Quark_Task_Flags *task_flags,
1139  int wsmode, int n, const int *K,
1140  const int *il_nondef, const int *iu_nondef,
1141  float *Q, int LDQ, float *W, const int *INDXC,
1142  float **WSglobal, float **WSlocal,
1143  int start, int end );
1144 void QUARK_CORE_slaed3_wscopy( Quark *quark, Quark_Task_Flags *task_flags,
1145  const int *K, const int *il_nondef, const int *iu_nondef,
1146  const float *Q, int LDQ, float **WORK,
1147  int start, int end );
1148 void QUARK_CORE_slaed3_updatevectors(Quark *quark, Quark_Task_Flags *task_flags,
1149  int oper, int wsmode, int n, int n1, int *K,
1150  int *il_nondef, int *iu_nondef,
1151  float *D, float *Q, int LDQ, float *Q2,
1152  int *INDXQ, int *COLTYP, float **WORK,
1153  int start, int end, float **WORKDEP);
1154 void QUARK_CORE_slaed3_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1155  int n, int n1, int *K, int *il_nondef, int *iu_nondef,
1156  float *D, float *Q, int LDQ, float *Q2,
1157  int *INDXC, int *INDXQ, int *COLTYP, float *W,
1158  int start, int end2);
1159 
1160 void QUARK_CORE_sDC_fakedep(Quark *quark, Quark_Task_Flags *task_flags,
1161  int nb_tasks, int nb, float *Q, int LDQ, float *W);
1162 #endif
1163 
1164 void QUARK_CORE_sswap(Quark *quark, Quark_Task_Flags *task_flags,
1165  int m, int n, float *Q,
1166  int LDQ, float *work,
1167  int *perm, int begin, int end);
1168 #ifdef COMPLEX
1169 void QUARK_CORE_slag2c(Quark *quark, Quark_Task_Flags *task_flags,
1170  int m, int n,
1171  const float *Q, int LDQ,
1172  float *Z, int LDZ);
1173 #endif
1174 void QUARK_CORE_slaed3_freebigwork(Quark *quark, Quark_Task_Flags *task_flags,
1175  int *K_bis, int largework, float **WORK);
1176 void QUARK_CORE_slaset_identity(Quark *quark, Quark_Task_Flags *task_flags,
1177  int n, int start, int size,
1178  float *A);
1179 
1183 void CORE_sasum_quark(Quark *quark);
1184 void CORE_sasum_f1_quark(Quark *quark);
1185 void CORE_sgeadd_quark(Quark *quark);
1186 void CORE_sbrdalg1_quark(Quark *quark);
1187 void CORE_sgelqt_quark(Quark *quark);
1188 void CORE_sgemm_quark(Quark *quark);
1189 void CORE_sgemm_tile_quark(Quark *quark);
1190 void CORE_sgemv_quark(Quark *quark);
1191 void CORE_sgemv_tile_quark(Quark *quark);
1192 void CORE_sgeqp3_init_quark(Quark *quark);
1193 void CORE_sgeqp3_larfg_quark(Quark *quark);
1194 void CORE_sgeqp3_norms_quark(Quark *quark);
1195 void CORE_sgeqp3_pivot_quark(Quark *quark);
1196 void CORE_sgeqp3_tntpiv_quark(Quark *quark);
1197 void CORE_sgeqp3_update_quark(Quark *quark);
1198 void CORE_sgeqrt_quark(Quark *quark);
1199 void CORE_sgessm_quark(Quark *quark);
1200 void CORE_sgessq_quark(Quark *quark);
1201 void CORE_sgessq_f1_quark(Quark *quark);
1202 void CORE_sgetrf_quark(Quark *quark);
1203 void CORE_sgetrf_incpiv_quark(Quark *quark);
1204 void CORE_sgetrf_nopiv_quark(Quark* quark);
1205 void CORE_sgetrf_reclap_quark(Quark *quark);
1206 void CORE_sgetrf_rectil_quark(Quark* quark);
1207 void CORE_sgetrip_quark(Quark *quark);
1208 void CORE_sgetrip_f1_quark(Quark *quark);
1209 void CORE_sgetrip_f2_quark(Quark *quark);
/*
 * CORE_ssymm_quark, CORE_ssyrk_quark and CORE_ssyr2k_quark are declared
 * unconditionally later in this list, so no COMPLEX-only copies are kept here.
 * The two wrappers below each take only the Quark handle and return nothing.
 */
1215 void CORE_ssygst_quark(Quark *quark);
1216 void CORE_ssyrfb_quark(Quark *quark);
1217 void CORE_shessq_quark(Quark *quark);
1218 void CORE_shessq_f1_quark(Quark *quark);
1219 void CORE_slacpy_quark(Quark *quark);
1220 void CORE_slacpy_f1_quark(Quark *quark);
1221 void CORE_slacpy_pivot_quark(Quark *quark);
1222 void CORE_slatro_quark(Quark *quark);
1223 void CORE_slatro_f1_quark(Quark *quark);
1224 void CORE_slange_quark(Quark *quark);
1225 void CORE_slange_f1_quark(Quark *quark);
/*
 * CORE_slansy_quark / CORE_slansy_f1_quark: one unconditional declaration
 * each, whether or not COMPLEX is defined.  Each wrapper takes only the Quark
 * handle and returns nothing.
 */
1230 void CORE_slansy_quark(Quark *quark);
1231 void CORE_slansy_f1_quark(Quark *quark);
1232 void CORE_slaset_quark(Quark *quark);
1233 void CORE_slaset2_quark(Quark *quark);
/*
 * CORE_slatro_quark is already declared earlier in this list, next to
 * CORE_slatro_f1_quark, so it is not repeated here.
 * CORE_slauum_quark takes only the Quark handle and returns nothing.
 */
1235 void CORE_slauum_quark(Quark *quark);
1236 void CORE_spamm_quark(Quark *quark);
/* CORE_splgsy_quark: takes only the Quark handle and returns nothing. */
1237 void CORE_splgsy_quark(Quark *quark);
1239 void CORE_splrnt_quark(Quark *quark);
1240 void CORE_spltmg_quark(Quark *quark);
1241 void CORE_splssq_quark(Quark *quark);
1242 void CORE_spotrf_quark(Quark *quark);
1243 void CORE_ssetvar_quark(Quark *quark);
1244 void CORE_sshift_quark(Quark *quark);
1245 void CORE_sshiftw_quark(Quark *quark);
1246 void CORE_sssssm_quark(Quark *quark);
1247 void CORE_ssymm_quark(Quark *quark);
1248 void CORE_ssyrk_quark(Quark *quark);
1249 void CORE_ssyr2k_quark(Quark *quark);
1250 void CORE_ssyssq_quark(Quark *quark);
1251 void CORE_ssyssq_f1_quark(Quark *quark);
1252 void CORE_sswpab_quark(Quark *quark);
1253 void CORE_sswptr_ontile_quark(Quark *quark);
1254 void CORE_strdalg1_quark(Quark *quark);
1255 void CORE_strmm_quark(Quark *quark);
1256 void CORE_strsm_quark(Quark *quark);
1257 void CORE_strtri_quark(Quark *quark);
1258 void CORE_stslqt_quark(Quark *quark);
1259 void CORE_stsmlq_quark(Quark *quark);
1260 void CORE_stsmlq_sytra1_quark(Quark *quark);
1261 void CORE_stsmlq_corner_quark(Quark *quark);
1262 void CORE_stsmqr_quark(Quark *quark);
1263 void CORE_stsmqr_sytra1_quark(Quark *quark);
1264 void CORE_stsmqr_corner_quark(Quark *quark);
1265 void CORE_stsqrt_quark(Quark *quark);
1266 void CORE_ststrf_quark(Quark *quark);
1267 void CORE_sttmqr_quark(Quark *quark);
1268 void CORE_sttqrt_quark(Quark *quark);
1269 void CORE_sttmlq_quark(Quark *quark);
1270 void CORE_sttlqt_quark(Quark *quark);
1271 void CORE_sormlq_quark(Quark *quark);
1272 void CORE_sormqr_quark(Quark *quark);
1273 void CORE_slaswp_quark(Quark* quark);
1274 void CORE_slaswp_f2_quark(Quark* quark);
1275 void CORE_slaswp_ontile_quark(Quark *quark);
1276 void CORE_slaswp_ontile_f2_quark(Quark *quark);
1277 void CORE_slaswpc_ontile_quark(Quark *quark);
1278 void CORE_strmm_p2_quark(Quark* quark);
1279 void CORE_sgemm_f2_quark(Quark* quark);
1280 void CORE_sgemm_p2_quark(Quark* quark);
1281 void CORE_sgemm_p2f1_quark(Quark* quark);
1282 void CORE_sgemm_p3_quark(Quark* quark);
1283 
1284 #endif /* defined(QUARK_H) */
1285 
1286 #ifdef __cplusplus
1287 }
1288 #endif
1289 
/*
 * NOTE(review): this header defines REAL near its top, but the macro undefined
 * here is COMPLEX, and no matching `#undef REAL` is visible in this part of
 * the file.  If there is none, REAL stays defined for code that follows an
 * #include of this header.  Confirm whether `#undef REAL` was intended.
 */
1290 #undef COMPLEX
1291 
1292 #endif
int CORE_sttqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttqrt.c:116
int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmlq.c:124
int CORE_sgetf2_nopiv(int m, int n, float *A, int lda)
Definition: core_sgetf2_nopiv.c:64
void CORE_spotrf(PLASMA_enum uplo, int N, float *A, int LDA, int *INFO)
Definition: core_spotrf.c:68
int CORE_slarfx2c(PLASMA_enum uplo, float V, float TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:177
int CORE_sswptr_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc, const float *Akk, int ldak)
Definition: core_slaswp.c:224
void CORE_sgbtype1cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype1cb.c:102
void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strsm.c:80
int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmlq.c:116
int CORE_spltmg_chebvand(int M, int N, float *A, int LDA, int gN, int m0, int n0, float *W)
Definition: core_spltmg_chebvand.c:83
int CORE_spamm(int op, PLASMA_enum side, PLASMA_enum storev, int M, int N, int K, int L, const float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, float *W, int LDW)
Definition: core_spamm.c:175
void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, float beta, float *C, int LDC)
Definition: core_ssyrk.c:80
void CORE_ssbtype2cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype2cb.c:101
void CORE_sgeqp3_larfg(PLASMA_desc A, int ii, int jj, int i, int j, float *tau, float *beta)
Definition: core_sgeqp3_larfg.c:78
int CORE_shbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbrce.c:78
void CORE_sswap(int m, int n, float *Q, int ldq, const float *work, const int *perm, int start, int end)
Definition: core_sswap.c:67
int CORE_spltmg(PLASMA_enum mtxtype, int m, int n, float *A, int lda, int gM, int gN, int m0, int n0, unsigned long long int seed)
Definition: core_spltmg.c:90
int CORE_slaswp_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:107
void CORE_slaset(PLASMA_enum uplo, int n1, int n2, float alpha, float beta, float *tileA, int ldtilea)
Definition: core_slaset.c:57
int CORE_ssyrfb(PLASMA_enum uplo, int N, int K, int IB, int NB, const float *A, int LDA, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_ssyrfb.c:110
int CORE_sgessm(int M, int N, int K, int IB, const int *IPIV, const float *L, int LDL, float *A, int LDA)
Definition: core_sgessm.c:70
int CORE_shblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shblrx.c:78
int CORE_slarfx2(PLASMA_enum side, int N, float V, float TAU, float *C1, int LDC1, float *C2, int LDC2)
Definition: core_slarfx_tbrd.c:82
void CORE_sgeqp3_pivot(PLASMA_desc A, float *F, int ldf, int jj, int k, int *jpvt, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_pivot.c:68
void CORE_sshiftw(int s, int cl, int m, int n, int L, float *A, float *W)
Definition: core_sshift.c:66
void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int lda, float *work)
Definition: core_strasm.c:66
void CORE_spltmg_condexq(int M, int N, float *Q, int LDQ)
Definition: core_spltmg_condex.c:53
void CORE_sgeqp3_update(const float *Ajj, int lda1, float *Ajk, int lda2, const float *Fk, int ldf, int joff, int k, int koff, int nb, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_update.c:82
void CORE_sgeqp3_norms(PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2)
Definition: core_sgeqp3_norms.c:62
void CORE_ssygst(int itype, PLASMA_enum uplo, int N, float *A, int LDA, float *B, int LDB, int *INFO)
Definition: core_ssygst.c:80
void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strmm.c:84
void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slantr.c:84
int CORE_sgetrf_incpiv(int M, int N, int IB, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf_incpiv.c:83
int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmqr.c:124
void CORE_sbrdalg1(PLASMA_enum uplo, int n, int nb, float *A, int lda, float *VQ, float *TAUQ, float *VP, float *TAUP, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_sbrdalg1.c:111
int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M1, int N1, int M2, int N2, int K, int L, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sparfb.c:132
int CORE_stsmqr_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_corner.c:130
int CORE_sgbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbrce.c:78
int CORE_stsmlq_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_corner.c:130
void CORE_ssbtype1cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype1cb.c:97
int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmqr.c:116
int CORE_sgeqrt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgeqrt.c:86
void CORE_splrnt(int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splrnt.c:68
void CORE_slauum(PLASMA_enum uplo, int N, float *A, int LDA)
Definition: core_slauum.c:57
void CORE_ssbtype3cb(int N, int NB, float *A, int LDA, const float *V, const float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype3cb.c:98
void CORE_slange(int norm, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slange.c:72
int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slatro.c:80
Definition: plasma.h:34
void CORE_strdalg1(int n, int nb, float *A, int lda, float *V, float *TAU, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_strdalg1.c:91
int CORE_slarfx2ce(PLASMA_enum uplo, float *V, float *TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:323
int CORE_sgbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbelr.c:81
int CORE_stsmqr_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_sytra1.c:127
int CORE_slacpy_pivot(const PLASMA_desc descA, PLASMA_enum direct, int k1, int k2, const int *ipiv, int *rankin, int *rankout, float *A, int lda, int init)
Definition: core_slacpy_pivot.c:84
int CORE_spltmg_hankel(PLASMA_enum uplo, int M, int N, float *A, int LDA, int m0, int n0, int nb, const float *V1, const float *V2)
Definition: core_spltmg_hankel.c:88
void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB, int M, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_sgemm.c:90
int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans, int M, int N, int K, int IB, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormqr.c:108
void CORE_slaset2(PLASMA_enum uplo, int n1, int n2, float alpha, float *tileA, int ldtilea)
Definition: core_slaset2.c:55
int CORE_stslqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stslqt.c:107
void CORE_slarfy(int N, float *A, int LDA, const float *V, const float *TAU, float *WORK)
Definition: core_slarfy.c:61
int CORE_sgetrf_nopiv(int m, int n, int ib, float *A, int lda)
Definition: core_sgetrf_nopiv.c:69
void CORE_sgetrip(int m, int n, float *A, float *work)
Definition: core_sgetrip.c:51
int CORE_shbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbelr.c:80
void CORE_spltmg_toeppd1(int gM, int m0, int M, float *W, unsigned long long int seed)
Definition: core_spltmg_toeppd.c:70
int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans, int M, int N, int IB, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormlq.c:108
int CORE_slascl(PLASMA_enum type, int kl, int ku, float cfrom, float cto, int m, int n, float *A, int lda)
Definition: core_slascl.c:72
int CORE_sttlqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttlqt.c:116
int CORE_sgetrf_reclap(int M, int N, float *A, int LDA, int *IPIV, int *info)
Definition: core_sgetrf_reclap.c:111
void CORE_splgsy(float bump, int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splgsy.c:72
void CORE_sgemv(PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, const float *x, int incx, float beta, float *y, int incy)
Definition: core_sgemv.c:78
int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M, int N, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_slarfb_gemm.c:113
void CORE_ssetvar(const float *alpha, float *x)
Definition: core_ssetvar.c:37
int CORE_stsmlq_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_sytra1.c:125
int CORE_slaswpc_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:296
int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev, int M, int N, int L, float ALPHA, const float *A, int LDA, const float *X, int INCX, float BETA, float *Y, int INCY, float *WORK)
Definition: core_spemv.c:118
int CORE_sgelqt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgelqt.c:85
Definition: plasma.h:24
void CORE_sgbtype2cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype2cb.c:105
void CORE_slaswp(int N, float *A, int LDA, int I1, int I2, const int *IPIV, int INC)
Definition: core_slaswp.c:62
int CORE_stsqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stsqrt.c:97
void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag, int N, float *A, int LDA, int *info)
Definition: core_strtri.c:66
void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo, int M, int N, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssymm.c:88
void CORE_sasum(int storev, PLASMA_enum uplo, int M, int N, const float *A, int lda, float *work)
Definition: core_sasum.c:61
int CORE_sssssm(int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *L1, int LDL1, const float *L2, int LDL2, const int *IPIV)
Definition: core_sssssm.c:94
void CORE_slacpy(PLASMA_enum uplo, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slacpy.c:59
Definition: descriptor.h:41
void CORE_spltmg_fiedler(int m, int n, const float *X, int incX, const float *Y, int incY, float *A, int lda)
Definition: core_spltmg_fiedler.c:75
int CORE_sgetrf_rectil(const PLASMA_desc A, int *IPIV, int *info)
Definition: core_sgetrf_rectil.c:110
void CORE_slansy(int norm, PLASMA_enum uplo, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slansy.c:74
void CORE_spltmg_toeppd2(int M, int N, int K, int m0, int n0, const float *W, float *A, int LDA)
Definition: core_spltmg_toeppd.c:149
int CORE_spltmg_circul(int M, int N, float *A, int LDA, int gM, int m0, int n0, const float *V)
Definition: core_spltmg_circul.c:76
int CORE_sgblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgblrx.c:80
void CORE_sswpab(int i, int n1, int n2, float *A, float *work)
Definition: core_sswpab.c:63
int CORE_sgeadd(int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_sgeadd.c:59
int CORE_ststrf(int M, int N, int IB, int NB, float *U, int LDU, float *A, int LDA, float *L, int LDL, int *IPIV, float *WORK, int LDWORK, int *INFO)
Definition: core_ststrf.c:99
void CORE_sgeqp3_init(int n, int *jpvt)
Definition: core_sgeqp3_init.c:38
void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssyr2k.c:90
void CORE_sgbtype3cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype3cb.c:103
int CORE_sgetrf(int M, int N, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf.c:60