18 #ifndef _PLASMA_CORE_SBLAS_H_
19 #define _PLASMA_CORE_SBLAS_H_
30 void CORE_sasum(
int storev, PLASMA_enum uplo,
int M,
int N,
31 const float *A,
int lda,
float *work);
41 int Vblksiz,
int wantz,
42 int i,
int sweepid,
int m,
int grsiz,
46 int st,
int ed,
int eltsize);
49 int st,
int ed,
int eltsize);
52 int st,
int ed,
int eltsize);
54 const float *A,
int LDA,
61 void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB,
63 float alpha,
const float *A,
int LDA,
64 const float *B,
int LDB,
65 float beta,
float *C,
int LDC);
66 void CORE_sgemv(PLASMA_enum trans,
int M,
int N,
67 float alpha,
const float *A,
int LDA,
68 const float *x,
int incx,
69 float beta,
float *y,
int incy);
72 float *tau,
float *beta );
75 int jj,
int k,
int *jpvt,
76 float *norms1,
float *norms2,
int *info );
77 int CORE_sgeqp3_tntpiv(
int m,
int n,
79 int *IPIV,
float *tau,
83 const float *Fk,
int ldf,
84 int joff,
int k,
int koff,
int nb,
85 float *norms1,
float *norms2,
90 float *TAU,
float *WORK);
93 const float *L,
int LDL,
/*
 * CORE_sgessq - prototype only; no definition is visible in this header chunk.
 * A is const-qualified (read-only); scale and sumsq are non-const, so the
 * callee may write through them.
 * Returns int; the meaning of the return value is not visible here.
 * NOTE(review): A is presumably M-by-N with leading dimension LDA - confirm.
 */
int CORE_sgessq(int M, int N,
                const float *A, int LDA,
                float *scale, float *sumsq);
102 int *IPIV,
int *INFO);
105 int *IPIV,
int *INFO);
110 int *IPIV,
int *info);
/*
 * CORE_sgetrf_reclap_init - prototype only; takes no arguments and returns
 * nothing. What state it initialises is not visible in this header chunk.
 */
void CORE_sgetrf_reclap_init(void);
/*
 * CORE_sgetrf_rectil_init - prototype only; takes no arguments and returns
 * nothing. What state it initialises is not visible in this header chunk.
 */
void CORE_sgetrf_rectil_init(void);
118 int st,
int ed,
int eltsize);
121 int st,
int ed,
int eltsize);
124 int st,
int ed,
int eltsize);
127 float *V,
float *TAU,
128 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
132 float *V,
float *TAU,
133 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
137 const float *V,
const float *TAU,
138 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
142 float *VQ,
float *TAUQ,
143 float *VP,
float *TAUP,
144 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
148 float *VQ,
float *TAUQ,
149 float *VP,
float *TAUP,
150 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
154 float *VQ,
float *TAUQ,
155 float *VP,
float *TAUP,
156 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
158 void CORE_ssygst(
int itype, PLASMA_enum uplo,
int N,
160 float *B,
int LDB,
int *INFO);
162 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
164 float alpha,
const float *A,
int LDA,
165 const float *B,
int LDB,
166 float beta,
float *C,
int LDC);
167 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
169 float alpha,
const float *A,
int LDA,
170 float beta,
float *C,
int LDC);
171 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
173 float alpha,
const float *A,
int LDA,
174 const float *B,
int LDB,
175 float beta,
float *C,
int LDC);
176 int CORE_shessq(PLASMA_enum uplo,
int N,
177 const float *A,
int LDA,
178 float *scale,
float *sumsq);
180 int CORE_ssyrfb(PLASMA_enum uplo,
int N,
int K,
int IB,
int NB,
181 const float *A,
int LDA,
182 const float *T,
int LDT,
184 float *WORK,
int LDWORK);
186 const float *A,
int LDA,
190 int k1,
int k2,
const int *ipiv,
191 int *rankin,
int *rankout,
195 const float *A,
int LDA,
196 float *work,
float *normA);
198 void CORE_slansy(
int norm, PLASMA_enum uplo,
int N,
199 const float *A,
int LDA,
200 float *work,
float *normA);
202 void CORE_slansy(
int norm, PLASMA_enum uplo,
int N,
203 const float *A,
int LDA,
204 float *work,
float *normA);
205 void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
207 const float *A,
int LDA,
208 float *work,
float *normA);
209 int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
211 const float *V,
int LDV,
212 const float *T,
int LDT,
214 float *WORK,
int LDWORK);
219 float *C2,
int LDC2);
238 float alpha,
float beta,
239 float *tileA,
int ldtilea);
240 void CORE_slaset2(PLASMA_enum uplo,
int n1,
int n2,
float alpha,
241 float *tileA,
int ldtilea);
243 int I1,
int I2,
const int *IPIV,
int INC);
246 int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans,
248 const float *A,
int LDA,
250 void CORE_slauum(PLASMA_enum uplo,
int N,
float *A,
int LDA);
251 int CORE_spamm(
int op, PLASMA_enum side, PLASMA_enum storev,
252 int M,
int N,
int K,
int L,
253 const float *A1,
int LDA1,
255 const float *V,
int LDV,
257 int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
258 int M1,
int N1,
int M2,
int N2,
int K,
int L,
261 const float *V,
int LDV,
262 const float *T,
int LDT,
263 float *WORK,
int LDWORK);
264 int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev,
267 const float *A,
int LDA,
268 const float *X,
int INCX,
/*
 * CORE_splgsy - prototype only; no definition is visible in this header chunk.
 * A is the only pointer argument and is writable.
 * seed is an unsigned long long passed by value.
 * NOTE(review): presumably fills an m-by-n tile located at (m0, n0) of a
 * bigM-row matrix from a seeded generator - confirm against the definition.
 */
void CORE_splgsy(float bump, int m, int n, float *A, int lda,
                 int bigM, int m0, int n0, unsigned long long int seed);
/*
 * CORE_splgsy - repeated prototype. This header declares CORE_splgsy more
 * than once with an identical signature; the repetition is redundant but
 * compatible.
 * A is the only pointer argument and is writable.
 */
void CORE_splgsy(float bump, int m, int n, float *A, int lda,
                 int bigM, int m0, int n0, unsigned long long int seed);
277 int bigM,
int m0,
int n0,
unsigned long long int seed );
278 int CORE_spltmg(PLASMA_enum mtxtype,
int m,
int n,
float *A,
int lda,
279 int gM,
int gN,
int m0,
int n0,
unsigned long long int seed );
281 int gN,
int m0,
int n0,
284 int gM,
int m0,
int n0,
288 const float *X,
int incX,
289 const float *Y,
int incY,
292 int m0,
int n0,
int nb,
296 unsigned long long int seed );
300 void CORE_spotrf(PLASMA_enum uplo,
int N,
float *A,
int LDA,
int *INFO);
302 void CORE_sshift(
int s,
int m,
int n,
int L,
306 int CORE_sssssm(
int M1,
int N1,
int M2,
int N2,
int K,
int IB,
309 const float *L1,
int LDL1,
310 const float *L2,
int LDL2,
312 int CORE_sstedc(PLASMA_enum compz,
int n,
315 float *WORK,
int LWORK,
317 float *RWORK,
int LRWORK,
319 int *IWORK,
int LIWORK);
320 int CORE_ssteqr(PLASMA_enum compz,
int n,
324 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
326 float alpha,
const float *A,
int LDA,
327 const float *B,
int LDB,
328 float beta,
float *C,
int LDC);
329 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
331 float alpha,
const float *A,
int LDA,
332 float beta,
float *C,
int LDC);
333 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
335 float alpha,
const float *A,
int LDA,
336 const float *B,
int LDB,
337 float beta,
float *C,
int LDC);
338 int CORE_ssyssq(PLASMA_enum uplo,
int N,
339 const float *A,
int LDA,
340 float *scale,
float *sumsq);
342 float *A,
float *work);
344 const float *Akk,
int ldak);
345 void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
346 int M,
int N,
const float *A,
int lda,
float *work);
353 int Vblksiz,
int wantz,
354 int i,
int sweepid,
int m,
int grsiz,
356 void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo,
357 PLASMA_enum transA, PLASMA_enum diag,
359 float alpha,
const float *A,
int LDA,
361 void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo,
362 PLASMA_enum transA, PLASMA_enum diag,
364 float alpha,
const float *A,
int LDA,
366 int CORE_strssq(PLASMA_enum uplo, PLASMA_enum diag,
int M,
int N,
367 const float *A,
int LDA,
368 float *scale,
float *sumsq);
369 void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag,
int N,
370 float *A,
int LDA,
int *info);
375 float *TAU,
float *WORK);
376 int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans,
377 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
380 const float *V,
int LDV,
381 const float *T,
int LDT,
382 float *WORK,
int LDWORK);
384 int k,
int ib,
int nb,
388 const float *V,
int ldv,
389 const float *T,
int ldt,
390 float *WORK,
int ldwork);
392 int m1,
int n1,
int m2,
int n2,
396 const float *V,
int ldv,
397 const float *T,
int ldt,
398 float *WORK,
int ldwork);
399 int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans,
400 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
403 const float *V,
int LDV,
404 const float *T,
int LDT,
405 float *WORK,
int LDWORK);
407 int k,
int ib,
int nb,
411 const float *V,
int ldv,
412 const float *T,
int ldt,
413 float *WORK,
int ldwork);
415 int m1,
int n1,
int m2,
int n2,
419 const float *V,
int ldv,
420 const float *T,
int ldt,
421 float *WORK,
int ldwork);
426 float *TAU,
float *WORK);
431 int *IPIV,
float *WORK,
432 int LDWORK,
int *INFO);
433 int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans,
434 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
437 const float *V,
int LDV,
438 const float *T,
int LDT,
439 float *WORK,
int LDWORK);
446 int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans,
447 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
450 const float *V,
int LDV,
451 const float *T,
int LDT,
452 float *WORK,
int LDWORK);
459 int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans,
460 int M,
int N,
int IB,
int K,
461 const float *V,
int LDV,
462 const float *T,
int LDT,
464 float *WORK,
int LDWORK);
465 int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans,
466 int M,
int N,
int K,
int IB,
467 const float *V,
int LDV,
468 const float *T,
int LDT,
470 float *WORK,
int LDWORK);
473 void CORE_slaed2_computeK(
int *K,
int n,
int n1,
474 float *beta,
float *D,
float *Q,
int LDQ,
475 float *Z,
float *DLAMBDA,
float *W,
476 int *INDX,
int *INDXC,
int *INDXP,
int *INDXQ,
478 void CORE_slaed2_compressq(
int n,
int n1,
const int *INDX,
const int *ctot,
479 const float *Q,
int LDQ,
float *Q2,
481 void CORE_slaed2_copydef(
int n,
int n1,
int K,
const int *ctot,
482 float *Q,
int LDQ,
const float *Q2,
484 int CORE_slaed4(
int n,
int K,
485 float *D,
float beta,
487 const float *D0,
const float *Z,
489 int start,
int end );
490 void CORE_slaed3_computeW(
int n,
int K,
491 const float *Q,
int LDQ,
492 const float *DLAMBDA,
float *W,
/*
 * CORE_slaed3_reduceW - prototype only; no definition is visible in this
 * header chunk.
 * Q and Wred are const-qualified (read-only); W is the only writable pointer.
 * NOTE(review): presumably combines l partial results held in Wred into W - confirm.
 */
void CORE_slaed3_reduceW(int n, int n1, int K, int l,
                         const float *Q, int LDQ,
                         const float *Wred, float *W);
498 void CORE_slaed3_computevectors(
int K,
int il_nondef,
int iu_nondef,
499 float *Q,
int LDQ,
float *W,
float *S,
/*
 * CORE_slaed3_merge - prototype only; no definition is visible in this
 * header chunk.
 * D and INDXQ are both writable pointers; n and K are passed by value.
 */
void CORE_slaed3_merge(int n, int K, float *D, int *INDXQ);
/*
 * CORE_slaed3_updatevectors - prototype only; no definition is visible in
 * this header chunk.
 * ctot is const-qualified (read-only); Q, Q2 and WORK are writable pointers.
 * NOTE(review): start/end presumably bound the range processed by one
 * call - confirm against the definition.
 */
void CORE_slaed3_updatevectors(int op, int wsmode, int n, int n1, int K,
                               int il_nondef, int iu_nondef,
                               float *Q, int ldq, float *Q2,
                               const int *ctot, float *WORK, int start, int end);
508 void CORE_sswap(
int m,
int n,
float *Q,
int ldq,
509 const float *work,
const int *perm,
511 int CORE_slascl(PLASMA_enum type,
int kl,
int ku,
float cfrom,
float cto,
512 int m,
int n,
float *A,
int lda);
514 int CORE_slag2c(
int m,
int n,
const float *Q,
int LDQ,
/*
 * CORE_slaed3_freebigwork - prototype only; no definition is visible in this
 * header chunk.
 * WORK is a pointer to a float pointer.
 * NOTE(review): presumably releases *WORK depending on oper - confirm who
 * owns the buffer before relying on this.
 */
void CORE_slaed3_freebigwork(int oper, float **WORK);
/*
 * CORE_slaed0_betaapprox - prototype only; no definition is visible in this
 * header chunk.
 * subpbs_info and E are const-qualified (read-only); D is writable.
 */
void CORE_slaed0_betaapprox(int subpbs, const int *subpbs_info,
                            float *D, const float *E);
522 int CORE_slapst(PLASMA_enum type,
int n,
523 const float *D,
int *INDX);
530 void QUARK_CORE_sasum(Quark *quark, Quark_Task_Flags *task_flags,
531 PLASMA_enum storev, PLASMA_enum uplo,
int m,
int n,
532 const float *A,
int lda,
int szeA,
533 float *work,
int szeW);
534 void QUARK_CORE_sasum_f1(Quark *quark, Quark_Task_Flags *task_flags,
535 PLASMA_enum storev, PLASMA_enum uplo,
int m,
int n,
536 const float *A,
int lda,
int szeA,
537 float *work,
int szeW,
538 float *fake,
int szeF);
539 void QUARK_CORE_sgeadd(Quark *quark, Quark_Task_Flags *task_flags,
540 int m,
int n,
int nb,
float alpha,
541 const float *A,
int lda,
543 void QUARK_CORE_sbrdalg1(Quark *quark, Quark_Task_Flags *task_flags,
552 int Vblksiz,
int wantz,
553 int i,
int sweepid,
int m,
int grsiz,
554 int *PCOL,
int *ACOL,
int *MCOL);
555 void QUARK_CORE_sgelqt(Quark *quark, Quark_Task_Flags *task_flags,
556 int m,
int n,
int ib,
int nb,
559 void QUARK_CORE_sgemm(Quark *quark, Quark_Task_Flags *task_flags,
560 PLASMA_enum transA, PLASMA_enum transB,
561 int m,
int n,
int k,
int nb,
562 float alpha,
const float *A,
int lda,
563 const float *B,
int ldb,
564 float beta,
float *C,
int ldc);
565 void QUARK_CORE_sgemm2( Quark *quark, Quark_Task_Flags *task_flags,
566 PLASMA_enum transA, PLASMA_enum transB,
567 int m,
int n,
int k,
int nb,
568 float alpha,
const float *A,
int lda,
569 const float *B,
int ldb,
570 float beta,
float *C,
int ldc);
571 void QUARK_CORE_sgemm_f2(Quark *quark, Quark_Task_Flags *task_flags,
572 PLASMA_enum transA, PLASMA_enum transB,
573 int m,
int n,
int k,
int nb,
574 float alpha,
const float *A,
int lda,
575 const float *B,
int ldb,
576 float beta,
float *C,
int ldc,
577 float *fake1,
int szefake1,
int flag1,
578 float *fake2,
int szefake2,
int flag2);
579 void QUARK_CORE_sgemm_p2(Quark *quark, Quark_Task_Flags *task_flags,
580 PLASMA_enum transA, PLASMA_enum transB,
581 int m,
int n,
int k,
int nb,
582 float alpha,
const float *A,
int lda,
583 const float **B,
int ldb,
584 float beta,
float *C,
int ldc);
585 void QUARK_CORE_sgemm_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
586 PLASMA_enum transA, PLASMA_enum transB,
587 int m,
int n,
int k,
int nb,
588 float alpha,
const float *A,
int lda,
589 const float **B,
int ldb,
590 float beta,
float *C,
int ldc,
591 float *fake1,
int szefake1,
int flag1);
592 void QUARK_CORE_sgemm_p3(Quark *quark, Quark_Task_Flags *task_flags,
593 PLASMA_enum transA, PLASMA_enum transB,
594 int m,
int n,
int k,
int nb,
595 float alpha,
const float *A,
int lda,
596 const float *B,
int ldb,
597 float beta,
float **C,
int ldc);
598 void QUARK_CORE_sgemm_tile(Quark *quark, Quark_Task_Flags *task_flags,
599 PLASMA_enum transA, PLASMA_enum transB,
600 int m,
int n,
int k,
int nb,
601 const float *alpha,
const float *A,
int lda,
602 const float *B,
int ldb,
603 const float *beta,
float *C,
int ldc,
607 void QUARK_CORE_sgemv(Quark *quark, Quark_Task_Flags *task_flags,
608 PLASMA_enum trans,
int m,
int n,
609 float alpha,
const float *A,
int lda,
610 const float *x,
int incx,
611 float beta,
float *y,
int incy);
612 void QUARK_CORE_sgemv_tile(Quark *quark, Quark_Task_Flags *task_flags,
615 const float *alpha,
const float *A,
int lda,
616 const float *x,
int incx,
617 const float *beta,
float *y,
int incy,
621 void QUARK_CORE_sgeqp3_init( Quark *quark, Quark_Task_Flags *task_flags,
623 void QUARK_CORE_sgeqp3_larfg(Quark *quark, Quark_Task_Flags *task_flags,
625 float *tau,
float *beta );
626 void QUARK_CORE_sgeqp3_norms( Quark *quark, Quark_Task_Flags *task_flags,
627 PLASMA_desc A,
int ioff,
int joff,
float *norms1,
float *norms2 );
628 void QUARK_CORE_sgeqp3_pivot( Quark *quark, Quark_Task_Flags *task_flags,
631 int jj,
int k,
int *jpvt,
632 float *norms1,
float *norms2,
int *info );
633 void QUARK_CORE_sgeqp3_tntpiv(Quark *quark, Quark_Task_Flags *task_flags,
634 int m,
int n,
int nb,
638 PLASMA_bool check_info,
int iinfo);
639 void QUARK_CORE_sgeqp3_update( Quark *quark, Quark_Task_Flags *task_flags,
640 float *Ajj,
int lda1,
641 float *Ajk,
int lda2,
643 int joff,
int k,
int koff,
int nb,
644 float *norms1,
float *norms2,
int *info );
645 void QUARK_CORE_sgeqrt(Quark *quark, Quark_Task_Flags *task_flags,
646 int m,
int n,
int ib,
int nb,
649 void QUARK_CORE_sgessm(Quark *quark, Quark_Task_Flags *task_flags,
650 int m,
int n,
int k,
int ib,
int nb,
652 const float *L,
int ldl,
654 void QUARK_CORE_sgessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
655 int m,
int n,
const float *A,
int lda,
656 float *scale,
float *sumsq,
657 float *fake,
int szeF,
int paramF );
658 void QUARK_CORE_sgetrf(Quark *quark, Quark_Task_Flags *task_flags,
659 int m,
int n,
int nb,
663 PLASMA_bool check_info,
int iinfo);
664 void QUARK_CORE_sgetrf_incpiv(Quark *quark, Quark_Task_Flags *task_flags,
665 int m,
int n,
int ib,
int nb,
669 PLASMA_bool check_info,
int iinfo);
670 void QUARK_CORE_sgetrf_nopiv(Quark *quark, Quark_Task_Flags *task_flags,
671 int m,
int n,
int ib,
int nb,
675 void QUARK_CORE_sgetrf_reclap(Quark *quark, Quark_Task_Flags *task_flags,
676 int m,
int n,
int nb,
680 PLASMA_bool check_info,
int iinfo,
682 void QUARK_CORE_sgetrf_rectil(Quark *quark, Quark_Task_Flags *task_flags,
686 PLASMA_bool check_info,
int iinfo,
688 void QUARK_CORE_sgetrip(Quark *quark, Quark_Task_Flags *task_flags,
689 int m,
int n,
float *A,
int szeA);
690 void QUARK_CORE_sgetrip_f1(Quark *quark, Quark_Task_Flags *task_flags,
691 int m,
int n,
float *A,
int szeA,
692 float *fake,
int szeF,
int paramF);
693 void QUARK_CORE_sgetrip_f2(Quark *quark, Quark_Task_Flags *task_flags,
694 int m,
int n,
float *A,
int szeA,
695 float *fake1,
int szeF1,
int paramF1,
696 float *fake2,
int szeF2,
int paramF2);
697 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
698 PLASMA_enum side, PLASMA_enum uplo,
699 int m,
int n,
int nb,
700 float alpha,
const float *A,
int lda,
701 const float *B,
int ldb,
702 float beta,
float *C,
int ldc);
703 void QUARK_CORE_ssygst(Quark *quark, Quark_Task_Flags *task_flags,
704 int itype, PLASMA_enum uplo,
int N,
709 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
710 PLASMA_enum uplo, PLASMA_enum trans,
711 int n,
int k,
int nb,
712 float alpha,
const float *A,
int lda,
713 float beta,
float *C,
int ldc);
714 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
715 PLASMA_enum uplo, PLASMA_enum trans,
716 int n,
int k,
int nb,
717 float alpha,
const float *A,
int lda,
718 const float *B,
int LDB,
719 float beta,
float *C,
int ldc);
720 void QUARK_CORE_ssyrfb(Quark *quark, Quark_Task_Flags *task_flags,
722 int n,
int k,
int ib,
int nb,
723 const float *A,
int lda,
724 const float *T,
int ldt,
726 void QUARK_CORE_shessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
727 PLASMA_enum uplo,
int n,
const float *A,
int lda,
728 float *scale,
float *sumsq,
729 float *fake,
int szeF,
int paramF );
730 void QUARK_CORE_slacpy(Quark *quark, Quark_Task_Flags *task_flags,
731 PLASMA_enum uplo,
int m,
int n,
int mb,
732 const float *A,
int lda,
734 void QUARK_CORE_slacpy_f1(Quark *quark, Quark_Task_Flags *task_flags,
735 PLASMA_enum uplo,
int m,
int n,
int nb,
736 const float *A,
int lda,
738 float *fake1,
int szefake1,
int flag1);
739 void QUARK_CORE_slacpy_pivot(Quark *quark, Quark_Task_Flags *task_flags,
742 int k1,
int k2,
const int *ipiv,
743 int *rankin,
int *rankout,
746 void QUARK_CORE_slange(Quark *quark, Quark_Task_Flags *task_flags,
747 int norm,
int M,
int N,
748 const float *A,
int LDA,
int szeA,
749 int szeW,
float *result);
750 void QUARK_CORE_slange_f1(Quark *quark, Quark_Task_Flags *task_flags,
751 int norm,
int M,
int N,
752 const float *A,
int LDA,
int szeA,
753 int szeW,
float *result,
754 float *fake,
int szeF);
756 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
757 int norm, PLASMA_enum uplo,
int N,
758 const float *A,
int LDA,
int szeA,
759 int szeW,
float *result);
760 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
761 int norm, PLASMA_enum uplo,
int N,
762 const float *A,
int LDA,
int szeA,
763 int szeW,
float *result,
764 float *fake,
int szeF);
766 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
767 int norm, PLASMA_enum uplo,
int N,
768 const float *A,
int LDA,
int szeA,
769 int szeW,
float *result);
770 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
771 int norm, PLASMA_enum uplo,
int N,
772 const float *A,
int LDA,
int szeA,
773 int szeW,
float *result,
774 float *fake,
int szeF);
775 void QUARK_CORE_slantr(Quark *quark, Quark_Task_Flags *task_flags,
776 PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
int M,
int N,
777 const float *A,
int LDA,
int szeA,
778 int szeW,
float *result);
779 void QUARK_CORE_slantr_f1(Quark *quark, Quark_Task_Flags *task_flags,
780 PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
int M,
int N,
781 const float *A,
int LDA,
int szeA,
782 int szeW,
float *result,
783 float *fake,
int szeF);
784 void QUARK_CORE_slaset(Quark *quark, Quark_Task_Flags *task_flags,
785 PLASMA_enum uplo,
int n1,
int n2,
float alpha,
786 float beta,
float *tileA,
int ldtilea);
787 void QUARK_CORE_slaset2(Quark *quark, Quark_Task_Flags *task_flags,
788 PLASMA_enum uplo,
int n1,
int n2,
float alpha,
789 float *tileA,
int ldtilea);
790 void QUARK_CORE_slaswp(Quark *quark, Quark_Task_Flags *task_flags,
791 int n,
float *A,
int lda,
792 int i1,
int i2,
const int *ipiv,
int inc);
793 void QUARK_CORE_slaswp_f2(Quark *quark, Quark_Task_Flags *task_flags,
794 int n,
float *A,
int lda,
795 int i1,
int i2,
const int *ipiv,
int inc,
796 float *fake1,
int szefake1,
int flag1,
797 float *fake2,
int szefake2,
int flag2);
798 void QUARK_CORE_slaswp_ontile(Quark *quark, Quark_Task_Flags *task_flags,
800 int i1,
int i2,
const int *ipiv,
int inc,
float *fakepanel);
801 void QUARK_CORE_slaswp_ontile_f2(Quark *quark, Quark_Task_Flags *task_flags,
803 int i1,
int i2,
const int *ipiv,
int inc,
804 float *fake1,
int szefake1,
int flag1,
805 float *fake2,
int szefake2,
int flag2);
806 void QUARK_CORE_slaswpc_ontile(Quark *quark, Quark_Task_Flags *task_flags,
808 int i1,
int i2,
const int *ipiv,
int inc,
float *fakepanel);
809 void QUARK_CORE_slatro(Quark *quark, Quark_Task_Flags *task_flags,
810 PLASMA_enum uplo, PLASMA_enum trans,
int m,
int n,
int mb,
811 const float *A,
int lda,
813 void QUARK_CORE_slatro_f1(Quark *quark, Quark_Task_Flags *task_flags,
814 PLASMA_enum uplo, PLASMA_enum trans,
int m,
int n,
int mb,
815 const float *A,
int lda,
817 float *fake1,
int szefake1,
int flag1);
818 void QUARK_CORE_slauum(Quark *quark, Quark_Task_Flags *task_flags,
819 PLASMA_enum uplo,
int n,
int nb,
821 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
822 float bump,
int m,
int n,
float *A,
int lda,
823 int bigM,
int m0,
int n0,
unsigned long long int seed );
824 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
825 float bump,
int m,
int n,
float *A,
int lda,
826 int bigM,
int m0,
int n0,
unsigned long long int seed );
827 void QUARK_CORE_splrnt(Quark *quark, Quark_Task_Flags *task_flags,
828 int m,
int n,
float *A,
int lda,
829 int bigM,
int m0,
int n0,
unsigned long long int seed );
830 void QUARK_CORE_spltmg(Quark *quark, Quark_Task_Flags *task_flags,
831 PLASMA_enum mtxtype,
int m,
int n,
float *A,
int lda,
832 int gM,
int gN,
int m0,
int n0,
unsigned long long int seed );
833 void QUARK_CORE_spltmg_chebvand( Quark *quark, Quark_Task_Flags *task_flags,
834 int M,
int N,
float *A,
int LDA,
835 int gN,
int m0,
int n0,
837 void QUARK_CORE_spltmg_circul( Quark *quark, Quark_Task_Flags *task_flags,
838 int M,
int N,
float *A,
int LDA,
839 int gM,
int m0,
int n0,
841 void QUARK_CORE_spltmg_fiedler(Quark *quark, Quark_Task_Flags *task_flags,
843 const float *X,
int incX,
844 const float *Y,
int incY,
846 void QUARK_CORE_spltmg_hankel( Quark *quark, Quark_Task_Flags *task_flags,
847 PLASMA_enum uplo,
int M,
int N,
float *A,
int LDA,
848 int m0,
int n0,
int nb,
851 void QUARK_CORE_spltmg_toeppd1(Quark *quark, Quark_Task_Flags *task_flags,
852 int gM,
int m0,
int M,
854 unsigned long long int seed);
855 void QUARK_CORE_spltmg_toeppd2(Quark *quark, Quark_Task_Flags *task_flags,
856 int M,
int N,
int K,
int m0,
int n0,
859 void QUARK_CORE_spotrf(Quark *quark, Quark_Task_Flags *task_flags,
860 PLASMA_enum uplo,
int n,
int nb,
864 void QUARK_CORE_ssetvar(Quark *quark, Quark_Task_Flags *task_flags,
865 const float *alpha,
float *x,
867 void QUARK_CORE_sshift( Quark *quark, Quark_Task_Flags *task_flags,
868 int s,
int m,
int n,
int L,
870 void QUARK_CORE_sshiftw(Quark *quark, Quark_Task_Flags *task_flags,
871 int s,
int cl,
int m,
int n,
int L,
873 void QUARK_CORE_sssssm(Quark *quark, Quark_Task_Flags *task_flags,
874 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
877 const float *L1,
int ldl1,
878 const float *L2,
int ldl2,
880 void QUARK_CORE_sstedc(Quark *quark, Quark_Task_Flags *task_flags,
881 PLASMA_enum compz,
int n,
884 void QUARK_CORE_sstedc_f2(Quark *quark, Quark_Task_Flags *task_flags,
885 PLASMA_enum compz,
int n,
888 void *fake1,
int szefake1,
int flag1,
889 void *fake2,
int szefake2,
int flag2);
890 void QUARK_CORE_ssteqr(Quark *quark, Quark_Task_Flags *task_flags,
891 PLASMA_enum compz,
int n,
894 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
895 PLASMA_enum side, PLASMA_enum uplo,
896 int m,
int n,
int nb,
897 float alpha,
const float *A,
int lda,
898 const float *B,
int ldb,
899 float beta,
float *C,
int ldc);
900 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
901 PLASMA_enum uplo, PLASMA_enum trans,
902 int n,
int k,
int nb,
903 float alpha,
const float *A,
int lda,
904 float beta,
float *C,
int ldc);
905 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
906 PLASMA_enum uplo, PLASMA_enum trans,
907 int n,
int k,
int nb,
908 float alpha,
const float *A,
int lda,
909 const float *B,
int LDB,
910 float beta,
float *C,
int ldc);
911 void QUARK_CORE_ssyssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
912 PLASMA_enum uplo,
int n,
const float *A,
int lda,
913 float *scale,
float *sumsq,
914 float *fake,
int szeF,
int paramF );
915 void QUARK_CORE_sswpab(Quark *quark, Quark_Task_Flags *task_flags,
916 int i,
int n1,
int n2,
918 void QUARK_CORE_sswptr_ontile(Quark *quark, Quark_Task_Flags *task_flags,
920 int i1,
int i2,
const int *ipiv,
int inc,
921 const float *Akk,
int ldak);
922 void QUARK_CORE_strasm(Quark *quark, Quark_Task_Flags *task_flags,
923 PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
int m,
int n,
924 const float *A,
int lda,
int szeA,
925 float *work,
int szeW);
926 void QUARK_CORE_strasm_f1(Quark *quark, Quark_Task_Flags *task_flags,
927 PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
int m,
int n,
928 const float *A,
int lda,
int szeA,
929 float *work,
int szeW,
930 float *fake,
int szeF);
931 void QUARK_CORE_strdalg1(Quark *quark, Quark_Task_Flags *task_flags,
938 int Vblksiz,
int wantz,
939 int i,
int sweepid,
int m,
int grsiz,
940 int *PCOL,
int *ACOL,
int *MCOL);
941 void QUARK_CORE_strmm(Quark *quark, Quark_Task_Flags *task_flags,
942 PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
943 int m,
int n,
int nb,
944 float alpha,
const float *A,
int lda,
946 void QUARK_CORE_strmm_p2(Quark *quark, Quark_Task_Flags *task_flags,
947 PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
948 int m,
int n,
int nb,
949 float alpha,
const float *A,
int lda,
951 void QUARK_CORE_strsm(Quark *quark, Quark_Task_Flags *task_flags,
952 PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
953 int m,
int n,
int nb,
954 float alpha,
const float *A,
int lda,
956 void QUARK_CORE_strssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
957 PLASMA_enum uplo, PLASMA_enum diag,
958 int m,
int n,
const float *A,
int lda,
959 float *scale,
float *sumsq,
960 float *fake,
int szeF,
int paramF );
961 void QUARK_CORE_strtri(Quark *quark, Quark_Task_Flags *task_flags,
962 PLASMA_enum uplo, PLASMA_enum diag,
int n,
int nb,
966 void QUARK_CORE_stslqt(Quark *quark, Quark_Task_Flags *task_flags,
967 int m,
int n,
int ib,
int nb,
971 void QUARK_CORE_stsmlq(Quark *quark, Quark_Task_Flags *task_flags,
972 PLASMA_enum side, PLASMA_enum trans,
973 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
976 const float *V,
int ldv,
977 const float *T,
int ldt);
978 void QUARK_CORE_stsmlq_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
979 PLASMA_enum side, PLASMA_enum trans,
980 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
983 const float *V,
int ldv,
984 const float *T,
int ldt);
985 void QUARK_CORE_stsmlq_corner(Quark *quark, Quark_Task_Flags *task_flags,
986 int m1,
int n1,
int m2,
int n2,
int m3,
int n3,
int k,
int ib,
int nb,
990 const float *V,
int ldv,
991 const float *T,
int ldt);
992 void QUARK_CORE_stsmqr(Quark *quark, Quark_Task_Flags *task_flags,
993 PLASMA_enum side, PLASMA_enum trans,
994 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
997 const float *V,
int ldv,
998 const float *T,
int ldt);
999 void QUARK_CORE_stsmqr_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
1000 PLASMA_enum side, PLASMA_enum trans,
1001 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1002 float *A1,
int lda1,
1003 float *A2,
int lda2,
1004 const float *V,
int ldv,
1005 const float *T,
int ldt);
1006 void QUARK_CORE_stsmqr_corner(Quark *quark, Quark_Task_Flags *task_flags,
1007 int m1,
int n1,
int m2,
int n2,
int m3,
int n3,
int k,
int ib,
int nb,
1008 float *A1,
int lda1,
1009 float *A2,
int lda2,
1010 float *A3,
int lda3,
1011 const float *V,
int ldv,
1012 const float *T,
int ldt);
1013 void QUARK_CORE_stsqrt(Quark *quark, Quark_Task_Flags *task_flags,
1014 int m,
int n,
int ib,
int nb,
1015 float *A1,
int lda1,
1016 float *A2,
int lda2,
1018 void QUARK_CORE_ststrf(Quark *quark, Quark_Task_Flags *task_flags,
1019 int m,
int n,
int ib,
int nb,
1025 PLASMA_bool check_info,
int iinfo);
1026 void QUARK_CORE_sttmqr(Quark *quark, Quark_Task_Flags *task_flags,
1027 PLASMA_enum side, PLASMA_enum trans,
1028 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1029 float *A1,
int lda1,
1030 float *A2,
int lda2,
1031 const float *V,
int ldv,
1032 const float *T,
int ldt);
1033 void QUARK_CORE_sttqrt(Quark *quark, Quark_Task_Flags *task_flags,
1034 int m,
int n,
int ib,
int nb,
1035 float *A1,
int lda1,
1036 float *A2,
int lda2,
1038 void QUARK_CORE_sttmlq(Quark *quark, Quark_Task_Flags *task_flags,
1039 PLASMA_enum side, PLASMA_enum trans,
1040 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1041 float *A1,
int lda1,
1042 float *A2,
int lda2,
1043 const float *V,
int ldv,
1044 const float *T,
int ldt);
1045 void QUARK_CORE_sttlqt(Quark *quark, Quark_Task_Flags *task_flags,
1046 int m,
int n,
int ib,
int nb,
1047 float *A1,
int lda1,
1048 float *A2,
int lda2,
1050 void QUARK_CORE_spamm(Quark *quark, Quark_Task_Flags *task_flags,
1051 int op, PLASMA_enum side, PLASMA_enum storev,
1052 int m,
int n,
int k,
int l,
1053 const float *A1,
int lda1,
1054 float *A2,
int lda2,
1055 const float *V,
int ldv,
1057 void QUARK_CORE_splssq( Quark *quark, Quark_Task_Flags *task_flags,
1058 int m,
const float *A,
float *result );
1059 void QUARK_CORE_sormlq(Quark *quark, Quark_Task_Flags *task_flags,
1060 PLASMA_enum side, PLASMA_enum trans,
1061 int m,
int n,
int ib,
int nb,
int k,
1062 const float *A,
int lda,
1063 const float *T,
int ldt,
1065 void QUARK_CORE_sormqr(Quark *quark, Quark_Task_Flags *task_flags,
1066 PLASMA_enum side, PLASMA_enum trans,
1067 int m,
int n,
int k,
int ib,
int nb,
1068 const float *A,
int lda,
1069 const float *T,
int ldt,
1073 void QUARK_CORE_slascl(Quark *quark, Quark_Task_Flags *task_flags,
1074 PLASMA_enum type,
int kl,
int ku,
float cfrom,
float cto,
1075 int m,
int n,
float *A,
int lda);
1076 void QUARK_CORE_slascl_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1077 PLASMA_enum type,
int kl,
int ku,
float *cfrom,
float *cto,
1078 int m,
int n,
float *A,
int lda,
1079 void *fake,
int szefake,
int flag);
1080 void QUARK_CORE_slaed0_lascl( Quark *quark, Quark_Task_Flags *task_flags,
1081 int n,
float *scale,
float *D,
float *E);
1082 void QUARK_CORE_slaed0_betaapprox(Quark *quark, Quark_Task_Flags *task_flags,
1083 int subpbs,
const int *subpbs_info,
1084 float *D,
const float *E);
1087 void QUARK_CORE_slaed2_computeK(Quark *quark, Quark_Task_Flags *task_flags,
1088 int *K1,
int n,
int n1,
1089 float *beta,
float *D,
float *Q,
int LDQ,
1090 float *Z,
float *DLAMBDA,
float *W,
1091 int *INDX,
int *INDXC,
int *INDXP,
int *INDXQ,
1093 float **Qmerge,
int wsmode,
1096 void QUARK_CORE_slaed1_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1097 int n,
int n1,
const int *K,
1098 const int *INDX,
const int *ctot,
1099 float *D,
const float *beta,
1100 float *Q,
int LDQ,
float *Q2,
1101 const float *DLAMBDA,
const float *W,
float *Wred,
1102 int start,
int end);
1103 void QUARK_CORE_slaed2_compressq(Quark *quark, Quark_Task_Flags *task_flags,
1104 int n,
int n1,
int start,
int end,
1105 const int *INDX,
const int *ctot,
1106 const float *Q,
int LDQ,
1108 void QUARK_CORE_slaed4_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1109 int n,
const int *K,
1110 float *D,
const float *beta,
1111 float **Q,
const int *LDQ,
1112 const float *DLAMBDA,
const float *W,
const int *INDX,
1115 void *fakeQ,
int flagfQ);
1116 void QUARK_CORE_slaed3_compW_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1117 int n,
const int *K,
1118 float **Q,
const int *LDQ,
1119 const float *DLAMBDA,
float *W,
1122 void *fakeQ,
int flagfQ,
1123 void *fakeW,
int flagfW);
1125 void QUARK_CORE_slaed3_reduceW(Quark *quark, Quark_Task_Flags *task_flags,
1126 int n,
int n1,
const int *K,
int l,
1127 const float *Q,
int LDQ,
1128 const float *Wred,
float *W);
/*
 * Prototype for QUARK_CORE_slaed3_reduceW_p2 (declaration only).
 * Same argument names as QUARK_CORE_slaed3_reduceW, except that Q is a
 * pointer to a float pointer (not const-qualified) and LDQ is a pointer
 * to a const int. K and Wred are const-qualified; W is not.
 */
1129 void QUARK_CORE_slaed3_reduceW_p2(Quark *quark, Quark_Task_Flags *task_flags,
1130 int n,
int n1,
const int *K,
int l,
1131 float **Q,
const int *LDQ,
1132 const float *Wred,
float *W);
/*
 * Prototype for QUARK_CORE_slaed2_copydef (declaration only).
 * K, ctot and Q2 are const-qualified; Q is the only non-const pointer.
 * NOTE(review): the qualifiers suggest data flows from Q2 into Q over
 * the start..end range -- confirm against the definition.
 */
1134 void QUARK_CORE_slaed2_copydef(Quark *quark, Quark_Task_Flags *task_flags,
1135 int n,
int n1,
const int *K,
const int *ctot,
1136 float *Q,
int LDQ,
const float *Q2,
1137 int start,
int end);
/*
 * Prototype for QUARK_CORE_slaed3_computevectors (declaration only).
 * K, il_nondef, iu_nondef and INDXC are const-qualified; Q and W are
 * non-const. WSglobal and WSlocal are pointers to float pointers.
 * NOTE(review): wsmode presumably selects between the two workspace
 * arguments -- its accepted values are not visible in this listing.
 */
1138 void QUARK_CORE_slaed3_computevectors(Quark *quark, Quark_Task_Flags *task_flags,
1139 int wsmode,
int n,
const int *K,
1140 const int *il_nondef,
const int *iu_nondef,
1141 float *Q,
int LDQ,
float *W,
const int *INDXC,
1142 float **WSglobal,
float **WSlocal,
1143 int start,
int end );
/*
 * Prototype for QUARK_CORE_slaed3_wscopy (declaration only).
 * K, il_nondef, iu_nondef and Q are const-qualified; WORK is a pointer
 * to a float pointer and is the only non-const pointer argument.
 * NOTE(review): the qualifiers suggest Q is the source and *WORK the
 * destination of a copy -- confirm against the definition.
 */
1144 void QUARK_CORE_slaed3_wscopy( Quark *quark, Quark_Task_Flags *task_flags,
1145 const int *K,
const int *il_nondef,
const int *iu_nondef,
1146 const float *Q,
int LDQ,
float **WORK,
1147 int start,
int end );
/*
 * Prototype for QUARK_CORE_slaed3_updatevectors (declaration only).
 * None of the pointer arguments is const-qualified here, including K,
 * il_nondef and iu_nondef, which are const in the neighbouring
 * computevectors and wscopy prototypes.
 * WORK and WORKDEP are pointers to float pointers.
 * NOTE(review): the accepted values of oper and wsmode, and the role of
 * WORKDEP, are not visible in this listing -- check the definition.
 */
1148 void QUARK_CORE_slaed3_updatevectors(Quark *quark, Quark_Task_Flags *task_flags,
1149 int oper,
int wsmode,
int n,
int n1,
int *K,
1150 int *il_nondef,
int *iu_nondef,
1151 float *D,
float *Q,
int LDQ,
float *Q2,
1152 int *INDXQ,
int *COLTYP,
float **WORK,
1153 int start,
int end,
float **WORKDEP);
/*
 * Prototype for QUARK_CORE_slaed3_pipelined (declaration only).
 * None of the pointer arguments is const-qualified.
 * The last parameter is named end2, whereas the other prototypes in this
 * group name the matching parameter end; parameter names in a prototype
 * do not affect callers.
 */
1154 void QUARK_CORE_slaed3_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1155 int n,
int n1,
int *K,
int *il_nondef,
int *iu_nondef,
1156 float *D,
float *Q,
int LDQ,
float *Q2,
1157 int *INDXC,
int *INDXQ,
int *COLTYP,
float *W,
1158 int start,
int end2);
/*
 * Prototype for QUARK_CORE_sDC_fakedep (declaration only).
 * After the QUARK handle and task flags it takes two ints (nb_tasks, nb),
 * a non-const float pointer Q with an int LDQ, and a non-const float
 * pointer W.
 * NOTE(review): the name suggests this only establishes task
 * dependencies rather than computing anything -- confirm in the
 * definition.
 */
1160 void QUARK_CORE_sDC_fakedep(Quark *quark, Quark_Task_Flags *task_flags,
1161 int nb_tasks,
int nb,
float *Q,
int LDQ,
float *W);
/*
 * Prototype for QUARK_CORE_sswap (declaration only).
 * The argument list mirrors the CORE_sswap signature listed further down
 * in this file (m, n, Q, ldq, work, perm, start, end), with two visible
 * differences: work and perm are not const-qualified here, and the range
 * start is named begin instead of start.
 */
1164 void QUARK_CORE_sswap(Quark *quark, Quark_Task_Flags *task_flags,
1165 int m,
int n,
float *Q,
1166 int LDQ,
float *work,
1167 int *perm,
int begin,
int end);
/*
 * Prototype for QUARK_CORE_slag2c (declaration only).
 * NOTE(review): this view of the prototype is incomplete. The listing
 * numbering goes 1169, 1171, 1174, and only "const float *Q, int LDQ,"
 * is visible between the opening line and the next prototype. The other
 * parameters and the closing parenthesis must be taken from the header.
 */
1169 void QUARK_CORE_slag2c(Quark *quark, Quark_Task_Flags *task_flags,
1171 const float *Q,
int LDQ,
/*
 * Prototype for QUARK_CORE_slaed3_freebigwork (declaration only).
 * Takes an int pointer K_bis, an int largework and a pointer to a float
 * pointer WORK.
 * NOTE(review): the name suggests it releases the buffer behind *WORK;
 * who owns that buffer and when it is freed is not visible here.
 */
1174 void QUARK_CORE_slaed3_freebigwork(Quark *quark, Quark_Task_Flags *task_flags,
1175 int *K_bis,
int largework,
float **WORK);
/*
 * Prototype for QUARK_CORE_slaset_identity (declaration only).
 * NOTE(review): this view of the prototype is incomplete. The parameter
 * list stops at "int size," (listing line 1177) and the next visible
 * listing line is 1183, so the remaining parameters and the closing
 * parenthesis are missing here. Take them from the header itself.
 */
1176 void QUARK_CORE_slaset_identity(Quark *quark, Quark_Task_Flags *task_flags,
1177 int n,
int start,
int size,
/*
 * Prototypes for the CORE_*_quark functions. Every declaration in this
 * run has the same shape: it returns void and takes a single Quark
 * pointer.
 * NOTE(review): presumably these are the task bodies that QUARK invokes
 * and that unpack their real arguments from the Quark handle -- confirm
 * against the definitions, which are not part of this listing.
 * NOTE(review): seven names are declared twice in this run:
 * CORE_ssymm_quark, CORE_ssyrk_quark, CORE_ssyr2k_quark,
 * CORE_slansy_quark, CORE_slansy_f1_quark, CORE_slatro_quark and
 * CORE_splgsy_quark. Repeating an identical prototype is legal C but
 * redundant. The listing numbering also skips 1210, 1214, 1226 and 1229
 * around some of them, so preprocessor lines may have been dropped from
 * this view -- check the header before removing anything.
 * The pointer star is written both as "Quark *quark" and "Quark* quark";
 * both spell the same type.
 */
1183 void CORE_sasum_quark(Quark *quark);
1184 void CORE_sasum_f1_quark(Quark *quark);
1185 void CORE_sgeadd_quark(Quark *quark);
1186 void CORE_sbrdalg1_quark(Quark *quark);
1187 void CORE_sgelqt_quark(Quark *quark);
1188 void CORE_sgemm_quark(Quark *quark);
1189 void CORE_sgemm_tile_quark(Quark *quark);
1190 void CORE_sgemv_quark(Quark *quark);
1191 void CORE_sgemv_tile_quark(Quark *quark);
1192 void CORE_sgeqp3_init_quark(Quark *quark);
1193 void CORE_sgeqp3_larfg_quark(Quark *quark);
1194 void CORE_sgeqp3_norms_quark(Quark *quark);
1195 void CORE_sgeqp3_pivot_quark(Quark *quark);
1196 void CORE_sgeqp3_tntpiv_quark(Quark *quark);
1197 void CORE_sgeqp3_update_quark(Quark *quark);
1198 void CORE_sgeqrt_quark(Quark *quark);
1199 void CORE_sgessm_quark(Quark *quark);
1200 void CORE_sgessq_quark(Quark *quark);
1201 void CORE_sgessq_f1_quark(Quark *quark);
1202 void CORE_sgetrf_quark(Quark *quark);
1203 void CORE_sgetrf_incpiv_quark(Quark *quark);
1204 void CORE_sgetrf_nopiv_quark(Quark* quark);
1205 void CORE_sgetrf_reclap_quark(Quark *quark);
1206 void CORE_sgetrf_rectil_quark(Quark* quark);
1207 void CORE_sgetrip_quark(Quark *quark);
1208 void CORE_sgetrip_f1_quark(Quark *quark);
1209 void CORE_sgetrip_f2_quark(Quark *quark);
/* First declarations of ssymm/ssyrk/ssyr2k; the same three are declared again further down. */
1211 void CORE_ssymm_quark(Quark *quark);
1212 void CORE_ssyrk_quark(Quark *quark);
1213 void CORE_ssyr2k_quark(Quark *quark);
1215 void CORE_ssygst_quark(Quark *quark);
1216 void CORE_ssyrfb_quark(Quark *quark);
1217 void CORE_shessq_quark(Quark *quark);
1218 void CORE_shessq_f1_quark(Quark *quark);
1219 void CORE_slacpy_quark(Quark *quark);
1220 void CORE_slacpy_f1_quark(Quark *quark);
1221 void CORE_slacpy_pivot_quark(Quark *quark);
1222 void CORE_slatro_quark(Quark *quark);
1223 void CORE_slatro_f1_quark(Quark *quark);
1224 void CORE_slange_quark(Quark *quark);
1225 void CORE_slange_f1_quark(Quark *quark);
1227 void CORE_slansy_quark(Quark *quark);
1228 void CORE_slansy_f1_quark(Quark *quark);
/* Repeats the two slansy prototypes declared immediately above. */
1230 void CORE_slansy_quark(Quark *quark);
1231 void CORE_slansy_f1_quark(Quark *quark);
1232 void CORE_slaset_quark(Quark *quark);
1233 void CORE_slaset2_quark(Quark *quark);
/* Second declaration of CORE_slatro_quark. */
1234 void CORE_slatro_quark(Quark *quark);
1235 void CORE_slauum_quark(Quark *quark);
1236 void CORE_spamm_quark(Quark *quark);
/* CORE_splgsy_quark is declared on two consecutive lines. */
1237 void CORE_splgsy_quark(Quark *quark);
1238 void CORE_splgsy_quark(Quark *quark);
1239 void CORE_splrnt_quark(Quark *quark);
1240 void CORE_spltmg_quark(Quark *quark);
1241 void CORE_splssq_quark(Quark *quark);
1242 void CORE_spotrf_quark(Quark *quark);
1243 void CORE_ssetvar_quark(Quark *quark);
1244 void CORE_sshift_quark(Quark *quark);
1245 void CORE_sshiftw_quark(Quark *quark);
1246 void CORE_sssssm_quark(Quark *quark);
/* Second declarations of ssymm/ssyrk/ssyr2k. */
1247 void CORE_ssymm_quark(Quark *quark);
1248 void CORE_ssyrk_quark(Quark *quark);
1249 void CORE_ssyr2k_quark(Quark *quark);
1250 void CORE_ssyssq_quark(Quark *quark);
1251 void CORE_ssyssq_f1_quark(Quark *quark);
1252 void CORE_sswpab_quark(Quark *quark);
1253 void CORE_sswptr_ontile_quark(Quark *quark);
1254 void CORE_strdalg1_quark(Quark *quark);
1255 void CORE_strmm_quark(Quark *quark);
1256 void CORE_strsm_quark(Quark *quark);
1257 void CORE_strtri_quark(Quark *quark);
1258 void CORE_stslqt_quark(Quark *quark);
1259 void CORE_stsmlq_quark(Quark *quark);
1260 void CORE_stsmlq_sytra1_quark(Quark *quark);
1261 void CORE_stsmlq_corner_quark(Quark *quark);
1262 void CORE_stsmqr_quark(Quark *quark);
1263 void CORE_stsmqr_sytra1_quark(Quark *quark);
1264 void CORE_stsmqr_corner_quark(Quark *quark);
1265 void CORE_stsqrt_quark(Quark *quark);
1266 void CORE_ststrf_quark(Quark *quark);
1267 void CORE_sttmqr_quark(Quark *quark);
1268 void CORE_sttqrt_quark(Quark *quark);
1269 void CORE_sttmlq_quark(Quark *quark);
1270 void CORE_sttlqt_quark(Quark *quark);
1271 void CORE_sormlq_quark(Quark *quark);
1272 void CORE_sormqr_quark(Quark *quark);
1273 void CORE_slaswp_quark(Quark* quark);
1274 void CORE_slaswp_f2_quark(Quark* quark);
1275 void CORE_slaswp_ontile_quark(Quark *quark);
1276 void CORE_slaswp_ontile_f2_quark(Quark *quark);
1277 void CORE_slaswpc_ontile_quark(Quark *quark);
1278 void CORE_strmm_p2_quark(Quark* quark);
1279 void CORE_sgemm_f2_quark(Quark* quark);
1280 void CORE_sgemm_p2_quark(Quark* quark);
1281 void CORE_sgemm_p2f1_quark(Quark* quark);
1282 void CORE_sgemm_p3_quark(Quark* quark);
int CORE_sttqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttqrt.c:116
int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmlq.c:124
int CORE_sgetf2_nopiv(int m, int n, float *A, int lda)
Definition: core_sgetf2_nopiv.c:64
void CORE_spotrf(PLASMA_enum uplo, int N, float *A, int LDA, int *INFO)
Definition: core_spotrf.c:68
int CORE_slarfx2c(PLASMA_enum uplo, float V, float TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:177
int CORE_sswptr_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc, const float *Akk, int ldak)
Definition: core_slaswp.c:224
void CORE_sgbtype1cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype1cb.c:102
void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strsm.c:80
int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmlq.c:116
int CORE_spltmg_chebvand(int M, int N, float *A, int LDA, int gN, int m0, int n0, float *W)
Definition: core_spltmg_chebvand.c:83
int CORE_spamm(int op, PLASMA_enum side, PLASMA_enum storev, int M, int N, int K, int L, const float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, float *W, int LDW)
Definition: core_spamm.c:175
void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, float beta, float *C, int LDC)
Definition: core_ssyrk.c:80
void CORE_ssbtype2cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype2cb.c:101
void CORE_sgeqp3_larfg(PLASMA_desc A, int ii, int jj, int i, int j, float *tau, float *beta)
Definition: core_sgeqp3_larfg.c:78
int CORE_shbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbrce.c:78
void CORE_sswap(int m, int n, float *Q, int ldq, const float *work, const int *perm, int start, int end)
Definition: core_sswap.c:67
int CORE_spltmg(PLASMA_enum mtxtype, int m, int n, float *A, int lda, int gM, int gN, int m0, int n0, unsigned long long int seed)
Definition: core_spltmg.c:90
int CORE_slaswp_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:107
void CORE_slaset(PLASMA_enum uplo, int n1, int n2, float alpha, float beta, float *tileA, int ldtilea)
Definition: core_slaset.c:57
int CORE_ssyrfb(PLASMA_enum uplo, int N, int K, int IB, int NB, const float *A, int LDA, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_ssyrfb.c:110
int CORE_sgessm(int M, int N, int K, int IB, const int *IPIV, const float *L, int LDL, float *A, int LDA)
Definition: core_sgessm.c:70
int CORE_shblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shblrx.c:78
int CORE_slarfx2(PLASMA_enum side, int N, float V, float TAU, float *C1, int LDC1, float *C2, int LDC2)
Definition: core_slarfx_tbrd.c:82
void CORE_sgeqp3_pivot(PLASMA_desc A, float *F, int ldf, int jj, int k, int *jpvt, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_pivot.c:68
void CORE_sshiftw(int s, int cl, int m, int n, int L, float *A, float *W)
Definition: core_sshift.c:66
void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int lda, float *work)
Definition: core_strasm.c:66
void CORE_spltmg_condexq(int M, int N, float *Q, int LDQ)
Definition: core_spltmg_condex.c:53
void CORE_sgeqp3_update(const float *Ajj, int lda1, float *Ajk, int lda2, const float *Fk, int ldf, int joff, int k, int koff, int nb, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_update.c:82
void CORE_sgeqp3_norms(PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2)
Definition: core_sgeqp3_norms.c:62
void CORE_ssygst(int itype, PLASMA_enum uplo, int N, float *A, int LDA, float *B, int LDB, int *INFO)
Definition: core_ssygst.c:80
void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strmm.c:84
void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slantr.c:84
int CORE_sgetrf_incpiv(int M, int N, int IB, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf_incpiv.c:83
int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmqr.c:124
void CORE_sbrdalg1(PLASMA_enum uplo, int n, int nb, float *A, int lda, float *VQ, float *TAUQ, float *VP, float *TAUP, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_sbrdalg1.c:111
int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M1, int N1, int M2, int N2, int K, int L, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sparfb.c:132
int CORE_stsmqr_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_corner.c:130
int CORE_sgbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbrce.c:78
int CORE_stsmlq_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_corner.c:130
void CORE_ssbtype1cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype1cb.c:97
int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmqr.c:116
int CORE_sgeqrt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgeqrt.c:86
void CORE_splrnt(int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splrnt.c:68
void CORE_slauum(PLASMA_enum uplo, int N, float *A, int LDA)
Definition: core_slauum.c:57
void CORE_ssbtype3cb(int N, int NB, float *A, int LDA, const float *V, const float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype3cb.c:98
void CORE_slange(int norm, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slange.c:72
int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slatro.c:80
void CORE_strdalg1(int n, int nb, float *A, int lda, float *V, float *TAU, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_strdalg1.c:91
int CORE_slarfx2ce(PLASMA_enum uplo, float *V, float *TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:323
int CORE_sgbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbelr.c:81
int CORE_stsmqr_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_sytra1.c:127
int CORE_slacpy_pivot(const PLASMA_desc descA, PLASMA_enum direct, int k1, int k2, const int *ipiv, int *rankin, int *rankout, float *A, int lda, int init)
Definition: core_slacpy_pivot.c:84
int CORE_spltmg_hankel(PLASMA_enum uplo, int M, int N, float *A, int LDA, int m0, int n0, int nb, const float *V1, const float *V2)
Definition: core_spltmg_hankel.c:88
void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB, int M, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_sgemm.c:90
int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans, int M, int N, int K, int IB, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormqr.c:108
void CORE_slaset2(PLASMA_enum uplo, int n1, int n2, float alpha, float *tileA, int ldtilea)
Definition: core_slaset2.c:55
int CORE_stslqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stslqt.c:107
void CORE_slarfy(int N, float *A, int LDA, const float *V, const float *TAU, float *WORK)
Definition: core_slarfy.c:61
int CORE_sgetrf_nopiv(int m, int n, int ib, float *A, int lda)
Definition: core_sgetrf_nopiv.c:69
void CORE_sgetrip(int m, int n, float *A, float *work)
Definition: core_sgetrip.c:51
int CORE_shbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbelr.c:80
void CORE_spltmg_toeppd1(int gM, int m0, int M, float *W, unsigned long long int seed)
Definition: core_spltmg_toeppd.c:70
int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans, int M, int N, int IB, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormlq.c:108
int CORE_slascl(PLASMA_enum type, int kl, int ku, float cfrom, float cto, int m, int n, float *A, int lda)
Definition: core_slascl.c:72
int CORE_sttlqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttlqt.c:116
int CORE_sgetrf_reclap(int M, int N, float *A, int LDA, int *IPIV, int *info)
Definition: core_sgetrf_reclap.c:111
void CORE_splgsy(float bump, int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splgsy.c:72
void CORE_sgemv(PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, const float *x, int incx, float beta, float *y, int incy)
Definition: core_sgemv.c:78
int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M, int N, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_slarfb_gemm.c:113
void CORE_ssetvar(const float *alpha, float *x)
Definition: core_ssetvar.c:37
int CORE_stsmlq_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_sytra1.c:125
int CORE_slaswpc_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:296
int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev, int M, int N, int L, float ALPHA, const float *A, int LDA, const float *X, int INCX, float BETA, float *Y, int INCY, float *WORK)
Definition: core_spemv.c:118
int CORE_sgelqt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgelqt.c:85
void CORE_sgbtype2cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype2cb.c:105
void CORE_slaswp(int N, float *A, int LDA, int I1, int I2, const int *IPIV, int INC)
Definition: core_slaswp.c:62
int CORE_stsqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stsqrt.c:97
void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag, int N, float *A, int LDA, int *info)
Definition: core_strtri.c:66
void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo, int M, int N, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssymm.c:88
void CORE_sasum(int storev, PLASMA_enum uplo, int M, int N, const float *A, int lda, float *work)
Definition: core_sasum.c:61
int CORE_sssssm(int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *L1, int LDL1, const float *L2, int LDL2, const int *IPIV)
Definition: core_sssssm.c:94
void CORE_slacpy(PLASMA_enum uplo, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slacpy.c:59
Definition: descriptor.h:41
void CORE_spltmg_fiedler(int m, int n, const float *X, int incX, const float *Y, int incY, float *A, int lda)
Definition: core_spltmg_fiedler.c:75
int CORE_sgetrf_rectil(const PLASMA_desc A, int *IPIV, int *info)
Definition: core_sgetrf_rectil.c:110
void CORE_slansy(int norm, PLASMA_enum uplo, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slansy.c:74
void CORE_spltmg_toeppd2(int M, int N, int K, int m0, int n0, const float *W, float *A, int LDA)
Definition: core_spltmg_toeppd.c:149
int CORE_spltmg_circul(int M, int N, float *A, int LDA, int gM, int m0, int n0, const float *V)
Definition: core_spltmg_circul.c:76
int CORE_sgblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgblrx.c:80
void CORE_sswpab(int i, int n1, int n2, float *A, float *work)
Definition: core_sswpab.c:63
int CORE_sgeadd(int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_sgeadd.c:59
int CORE_ststrf(int M, int N, int IB, int NB, float *U, int LDU, float *A, int LDA, float *L, int LDL, int *IPIV, float *WORK, int LDWORK, int *INFO)
Definition: core_ststrf.c:99
void CORE_sgeqp3_init(int n, int *jpvt)
Definition: core_sgeqp3_init.c:38
void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssyr2k.c:90
void CORE_sgbtype3cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype3cb.c:103
int CORE_sgetrf(int M, int N, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf.c:60