18 #ifndef _PLASMA_CORE_SBLAS_H_
19 #define _PLASMA_CORE_SBLAS_H_
33 void CORE_sasum(
int storev, PLASMA_enum uplo,
int M,
int N,
34 const float *A,
int lda,
float *work);
44 int Vblksiz,
int wantz,
45 int i,
int sweepid,
int m,
int grsiz,
49 int st,
int ed,
int eltsize);
52 int st,
int ed,
int eltsize);
55 int st,
int ed,
int eltsize);
58 const float *A,
int LDA,
66 void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB,
68 float alpha,
const float *A,
int LDA,
69 const float *B,
int LDB,
70 float beta,
float *C,
int LDC);
71 void CORE_sgemv(PLASMA_enum trans,
int M,
int N,
72 float alpha,
const float *A,
int LDA,
73 const float *x,
int incx,
74 float beta,
float *y,
int incy);
77 float *tau,
float *beta );
80 int jj,
int k,
int *jpvt,
81 float *norms1,
float *norms2,
int *info );
82 int CORE_sgeqp3_tntpiv(
int m,
int n,
84 int *IPIV,
float *tau,
88 const float *Fk,
int ldf,
89 int joff,
int k,
int koff,
int nb,
90 float *norms1,
float *norms2,
95 float *TAU,
float *WORK);
98 const float *L,
int LDL,
/**
 * CORE_sgessq - prototype only; the definition is not in this header.
 *
 * A is read-only through this pointer; scale and sumsq are writable.
 * Returns int.
 * NOTE(review): presumably updates a scaled sum of squares
 * (scale, sumsq) over the M-by-N tile A, LAPACK xLASSQ style, and returns a
 * status code - confirm against the implementation.
 */
int CORE_sgessq(int M, int N,
                const float *A, int LDA,
                float *scale, float *sumsq);
107 int *IPIV,
int *INFO);
110 int *IPIV,
int *INFO);
115 int *IPIV,
int *info);
123 int st,
int ed,
int eltsize);
126 int st,
int ed,
int eltsize);
129 int st,
int ed,
int eltsize);
132 float *V,
float *TAU,
133 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
137 float *V,
float *TAU,
138 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
142 const float *V,
const float *TAU,
143 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
147 float *VQ,
float *TAUQ,
148 float *VP,
float *TAUP,
149 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
153 float *VQ,
float *TAUQ,
154 float *VP,
float *TAUP,
155 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
159 float *VQ,
float *TAUQ,
160 float *VP,
float *TAUP,
161 int st,
int ed,
int sweep,
int Vblksiz,
int WANTZ,
163 void CORE_ssygst(
int itype, PLASMA_enum uplo,
int N,
165 float *B,
int LDB,
int *INFO);
167 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
169 float alpha,
const float *A,
int LDA,
170 const float *B,
int LDB,
171 float beta,
float *C,
int LDC);
172 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
174 float alpha,
const float *A,
int LDA,
175 float beta,
float *C,
int LDC);
176 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
178 float alpha,
const float *A,
int LDA,
179 const float *B,
int LDB,
180 float beta,
float *C,
int LDC);
181 int CORE_shessq(PLASMA_enum uplo,
int N,
182 const float *A,
int LDA,
183 float *scale,
float *sumsq);
185 int CORE_ssyrfb(PLASMA_enum uplo,
int N,
int K,
int IB,
int NB,
186 const float *A,
int LDA,
187 const float *T,
int LDT,
189 float *WORK,
int LDWORK);
191 const float *A,
int LDA,
195 int k1,
int k2,
const int *ipiv,
196 int *rankin,
int *rankout,
200 const float *A,
int LDA,
201 float *work,
float *normA);
203 void CORE_slansy(
int norm, PLASMA_enum uplo,
int N,
204 const float *A,
int LDA,
205 float *work,
float *normA);
207 void CORE_slansy(
int norm, PLASMA_enum uplo,
int N,
208 const float *A,
int LDA,
209 float *work,
float *normA);
210 void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
212 const float *A,
int LDA,
213 float *work,
float *normA);
214 int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
216 const float *V,
int LDV,
217 const float *T,
int LDT,
219 float *WORK,
int LDWORK);
224 float *C2,
int LDC2);
243 float alpha,
float *A,
int lda);
245 float alpha,
float beta,
246 float *tileA,
int ldtilea);
247 void CORE_slaset2(PLASMA_enum uplo,
int n1,
int n2,
float alpha,
248 float *tileA,
int ldtilea);
250 int I1,
int I2,
const int *IPIV,
int INC);
253 int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans,
255 const float *A,
int LDA,
257 void CORE_slauum(PLASMA_enum uplo,
int N,
float *A,
int LDA);
258 int CORE_spamm(
int op, PLASMA_enum side, PLASMA_enum storev,
259 int M,
int N,
int K,
int L,
260 const float *A1,
int LDA1,
262 const float *V,
int LDV,
264 int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
265 int M1,
int N1,
int M2,
int N2,
int K,
int L,
268 const float *V,
int LDV,
269 const float *T,
int LDT,
270 float *WORK,
int LDWORK);
271 int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev,
274 const float *A,
int LDA,
275 const float *X,
int INCX,
/**
 * CORE_splgsy - prototype only; the definition is not in this header.
 *
 * A is the only writable buffer. This header declares CORE_splgsy more than
 * once with an identical signature; the repetition is redundant but legal.
 * NOTE(review): presumably generates an m-by-n tile of a pseudo-random
 * symmetric matrix (global size bigM, tile offset m0/n0, diagonal shifted
 * by bump) from seed - confirm against the implementation.
 */
void CORE_splgsy(float bump, int m, int n, float *A, int lda,
                 int bigM, int m0, int n0, unsigned long long int seed);
/**
 * CORE_splgsy - repeated prototype; the definition is not in this header.
 *
 * An identical declaration of CORE_splgsy also appears elsewhere in this
 * header; repeating a compatible prototype is legal C but redundant.
 * A is the only writable buffer.
 */
void CORE_splgsy(float bump, int m, int n, float *A, int lda,
                 int bigM, int m0, int n0, unsigned long long int seed);
284 int bigM,
int m0,
int n0,
unsigned long long int seed );
285 int CORE_spltmg(PLASMA_enum mtxtype,
int m,
int n,
float *A,
int lda,
286 int gM,
int gN,
int m0,
int n0,
unsigned long long int seed );
288 int gN,
int m0,
int n0,
291 int gM,
int m0,
int n0,
295 const float *X,
int incX,
296 const float *Y,
int incY,
299 int m0,
int n0,
int nb,
303 unsigned long long int seed );
307 void CORE_spotrf(PLASMA_enum uplo,
int N,
float *A,
int LDA,
int *INFO);
309 void CORE_sshift(
int s,
int m,
int n,
int L,
313 int CORE_sssssm(
int M1,
int N1,
int M2,
int N2,
int K,
int IB,
316 const float *L1,
int LDL1,
317 const float *L2,
int LDL2,
322 float *WORK,
int LWORK,
324 float *RWORK,
int LRWORK,
326 int *IWORK,
int LIWORK);
331 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
333 float alpha,
const float *A,
int LDA,
334 const float *B,
int LDB,
335 float beta,
float *C,
int LDC);
336 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
338 float alpha,
const float *A,
int LDA,
339 float beta,
float *C,
int LDC);
340 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
342 float alpha,
const float *A,
int LDA,
343 const float *B,
int LDB,
344 float beta,
float *C,
int LDC);
345 int CORE_ssyssq(PLASMA_enum uplo,
int N,
346 const float *A,
int LDA,
347 float *scale,
float *sumsq);
349 float *A,
float *work);
351 const float *Akk,
int ldak);
352 int CORE_stradd(PLASMA_enum uplo, PLASMA_enum trans,
int M,
int N,
354 const float *A,
int LDA,
357 void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
358 int M,
int N,
const float *A,
int lda,
float *work);
365 int Vblksiz,
int wantz,
366 int i,
int sweepid,
int m,
int grsiz,
368 void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo,
369 PLASMA_enum transA, PLASMA_enum diag,
371 float alpha,
const float *A,
int LDA,
373 void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo,
374 PLASMA_enum transA, PLASMA_enum diag,
376 float alpha,
const float *A,
int LDA,
378 int CORE_strssq(PLASMA_enum uplo, PLASMA_enum diag,
int M,
int N,
379 const float *A,
int LDA,
380 float *scale,
float *sumsq);
381 void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag,
int N,
382 float *A,
int LDA,
int *info);
387 float *TAU,
float *WORK);
388 int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans,
389 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
392 const float *V,
int LDV,
393 const float *T,
int LDT,
394 float *WORK,
int LDWORK);
396 int k,
int ib,
int nb,
400 const float *V,
int ldv,
401 const float *T,
int ldt,
402 float *WORK,
int ldwork);
404 int m1,
int n1,
int m2,
int n2,
408 const float *V,
int ldv,
409 const float *T,
int ldt,
410 float *WORK,
int ldwork);
411 int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans,
412 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
415 const float *V,
int LDV,
416 const float *T,
int LDT,
417 float *WORK,
int LDWORK);
419 int k,
int ib,
int nb,
423 const float *V,
int ldv,
424 const float *T,
int ldt,
425 float *WORK,
int ldwork);
427 int m1,
int n1,
int m2,
int n2,
431 const float *V,
int ldv,
432 const float *T,
int ldt,
433 float *WORK,
int ldwork);
438 float *TAU,
float *WORK);
443 int *IPIV,
float *WORK,
444 int LDWORK,
int *INFO);
445 int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans,
446 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
449 const float *V,
int LDV,
450 const float *T,
int LDT,
451 float *WORK,
int LDWORK);
458 int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans,
459 int M1,
int N1,
int M2,
int N2,
int K,
int IB,
462 const float *V,
int LDV,
463 const float *T,
int LDT,
464 float *WORK,
int LDWORK);
471 int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans,
472 int M,
int N,
int IB,
int K,
473 const float *V,
int LDV,
474 const float *T,
int LDT,
476 float *WORK,
int LDWORK);
477 int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans,
478 int M,
int N,
int K,
int IB,
479 const float *V,
int LDV,
480 const float *T,
int LDT,
482 float *WORK,
int LDWORK);
486 float *beta,
float *D,
float *Q,
int LDQ,
487 float *Z,
float *DLAMBDA,
float *W,
488 int *INDX,
int *INDXC,
int *INDXP,
int *INDXQ,
491 const float *Q,
int LDQ,
float *Q2,
494 float *Q,
int LDQ,
const float *Q2,
497 float *D,
float beta,
499 const float *D0,
const float *Z,
501 int start,
int end );
503 const float *Q,
int LDQ,
504 const float *DLAMBDA,
float *W,
508 const float *Q,
int LDQ,
509 const float *Wred,
float *W);
511 float *Q,
int LDQ,
float *W,
float *S,
516 int il_nondef,
int iu_nondef,
517 float *Q,
int ldq,
float *Q2,
518 const int *ctot,
float *WORK,
int start,
int end);
520 void CORE_sswap(
int m,
int n,
float *Q,
int ldq,
521 const float *work,
const int *perm,
523 int CORE_slascl(PLASMA_enum type,
int kl,
int ku,
float cfrom,
float cto,
524 int m,
int n,
float *A,
int lda);
526 int CORE_slag2c(
int m,
int n,
const float *Q,
int LDQ,
/**
 * CORE_slaed3_freebigwork - prototype only; the definition is not in this
 * header.
 *
 * WORK is a pointer to a float pointer.
 * NOTE(review): presumably releases the workspace referenced by *WORK
 * depending on oper - confirm ownership rules against the implementation.
 */
void CORE_slaed3_freebigwork(int oper, float **WORK);
533 float *D,
const float *E);
534 int CORE_slapst(PLASMA_enum type,
int n,
535 const float *D,
int *INDX);
542 void QUARK_CORE_sasum(Quark *quark, Quark_Task_Flags *task_flags,
543 PLASMA_enum storev, PLASMA_enum uplo,
int m,
int n,
544 const float *A,
int lda,
int szeA,
545 float *work,
int szeW);
546 void QUARK_CORE_sasum_f1(Quark *quark, Quark_Task_Flags *task_flags,
547 PLASMA_enum storev, PLASMA_enum uplo,
int m,
int n,
548 const float *A,
int lda,
int szeA,
549 float *work,
int szeW,
550 float *fake,
int szeF);
551 void QUARK_CORE_sgeadd(Quark *quark, Quark_Task_Flags *task_flags,
552 PLASMA_enum trans,
int m,
int n,
int nb,
554 const float *A,
int lda,
557 void QUARK_CORE_sbrdalg1(Quark *quark, Quark_Task_Flags *task_flags,
566 int Vblksiz,
int wantz,
567 int i,
int sweepid,
int m,
int grsiz,
568 int *PCOL,
int *ACOL,
int *MCOL);
569 void QUARK_CORE_sgelqt(Quark *quark, Quark_Task_Flags *task_flags,
570 int m,
int n,
int ib,
int nb,
573 void QUARK_CORE_sgemm(Quark *quark, Quark_Task_Flags *task_flags,
574 PLASMA_enum transA, PLASMA_enum transB,
575 int m,
int n,
int k,
int nb,
576 float alpha,
const float *A,
int lda,
577 const float *B,
int ldb,
578 float beta,
float *C,
int ldc);
579 void QUARK_CORE_sgemm2( Quark *quark, Quark_Task_Flags *task_flags,
580 PLASMA_enum transA, PLASMA_enum transB,
581 int m,
int n,
int k,
int nb,
582 float alpha,
const float *A,
int lda,
583 const float *B,
int ldb,
584 float beta,
float *C,
int ldc);
585 void QUARK_CORE_sgemm_f2(Quark *quark, Quark_Task_Flags *task_flags,
586 PLASMA_enum transA, PLASMA_enum transB,
587 int m,
int n,
int k,
int nb,
588 float alpha,
const float *A,
int lda,
589 const float *B,
int ldb,
590 float beta,
float *C,
int ldc,
591 float *fake1,
int szefake1,
int flag1,
592 float *fake2,
int szefake2,
int flag2);
593 void QUARK_CORE_sgemm_p2(Quark *quark, Quark_Task_Flags *task_flags,
594 PLASMA_enum transA, PLASMA_enum transB,
595 int m,
int n,
int k,
int nb,
596 float alpha,
const float *A,
int lda,
597 const float **B,
int ldb,
598 float beta,
float *C,
int ldc);
599 void QUARK_CORE_sgemm_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
600 PLASMA_enum transA, PLASMA_enum transB,
601 int m,
int n,
int k,
int nb,
602 float alpha,
const float *A,
int lda,
603 const float **B,
int ldb,
604 float beta,
float *C,
int ldc,
605 float *fake1,
int szefake1,
int flag1);
606 void QUARK_CORE_sgemm_p3(Quark *quark, Quark_Task_Flags *task_flags,
607 PLASMA_enum transA, PLASMA_enum transB,
608 int m,
int n,
int k,
int nb,
609 float alpha,
const float *A,
int lda,
610 const float *B,
int ldb,
611 float beta,
float **C,
int ldc);
612 void QUARK_CORE_sgemm_tile(Quark *quark, Quark_Task_Flags *task_flags,
613 PLASMA_enum transA, PLASMA_enum transB,
614 int m,
int n,
int k,
int nb,
615 const float *alpha,
const float *A,
int lda,
616 const float *B,
int ldb,
617 const float *beta,
float *C,
int ldc,
621 void QUARK_CORE_sgemv(Quark *quark, Quark_Task_Flags *task_flags,
622 PLASMA_enum trans,
int m,
int n,
623 float alpha,
const float *A,
int lda,
624 const float *x,
int incx,
625 float beta,
float *y,
int incy);
626 void QUARK_CORE_sgemv_tile(Quark *quark, Quark_Task_Flags *task_flags,
629 const float *alpha,
const float *A,
int lda,
630 const float *x,
int incx,
631 const float *beta,
float *y,
int incy,
635 void QUARK_CORE_sgeqp3_init( Quark *quark, Quark_Task_Flags *task_flags,
637 void QUARK_CORE_sgeqp3_larfg(Quark *quark, Quark_Task_Flags *task_flags,
639 float *tau,
float *beta );
640 void QUARK_CORE_sgeqp3_norms( Quark *quark, Quark_Task_Flags *task_flags,
641 PLASMA_desc A,
int ioff,
int joff,
float *norms1,
float *norms2 );
642 void QUARK_CORE_sgeqp3_pivot( Quark *quark, Quark_Task_Flags *task_flags,
645 int jj,
int k,
int *jpvt,
646 float *norms1,
float *norms2,
int *info );
647 void QUARK_CORE_sgeqp3_tntpiv(Quark *quark, Quark_Task_Flags *task_flags,
648 int m,
int n,
int nb,
652 PLASMA_bool check_info,
int iinfo);
653 void QUARK_CORE_sgeqp3_update( Quark *quark, Quark_Task_Flags *task_flags,
654 float *Ajj,
int lda1,
655 float *Ajk,
int lda2,
657 int joff,
int k,
int koff,
int nb,
658 float *norms1,
float *norms2,
int *info );
659 void QUARK_CORE_sgeqrt(Quark *quark, Quark_Task_Flags *task_flags,
660 int m,
int n,
int ib,
int nb,
663 void QUARK_CORE_sgessm(Quark *quark, Quark_Task_Flags *task_flags,
664 int m,
int n,
int k,
int ib,
int nb,
666 const float *L,
int ldl,
668 void QUARK_CORE_sgessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
669 int m,
int n,
const float *A,
int lda,
670 float *scale,
float *sumsq,
671 float *fake,
int szeF,
int paramF );
672 void QUARK_CORE_sgetrf(Quark *quark, Quark_Task_Flags *task_flags,
673 int m,
int n,
int nb,
677 PLASMA_bool check_info,
int iinfo);
678 void QUARK_CORE_sgetrf_incpiv(Quark *quark, Quark_Task_Flags *task_flags,
679 int m,
int n,
int ib,
int nb,
683 PLASMA_bool check_info,
int iinfo);
684 void QUARK_CORE_sgetrf_nopiv(Quark *quark, Quark_Task_Flags *task_flags,
685 int m,
int n,
int ib,
int nb,
689 void QUARK_CORE_sgetrf_reclap(Quark *quark, Quark_Task_Flags *task_flags,
694 PLASMA_bool check_info,
int iinfo,
696 void QUARK_CORE_sgetrf_rectil(Quark *quark, Quark_Task_Flags *task_flags,
701 PLASMA_bool check_info,
int iinfo,
703 void QUARK_CORE_sgetrip(Quark *quark, Quark_Task_Flags *task_flags,
704 int m,
int n,
float *A,
int szeA);
705 void QUARK_CORE_sgetrip_f1(Quark *quark, Quark_Task_Flags *task_flags,
706 int m,
int n,
float *A,
int szeA,
707 float *fake,
int szeF,
int paramF);
708 void QUARK_CORE_sgetrip_f2(Quark *quark, Quark_Task_Flags *task_flags,
709 int m,
int n,
float *A,
int szeA,
710 float *fake1,
int szeF1,
int paramF1,
711 float *fake2,
int szeF2,
int paramF2);
712 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
713 PLASMA_enum side, PLASMA_enum uplo,
714 int m,
int n,
int nb,
715 float alpha,
const float *A,
int lda,
716 const float *B,
int ldb,
717 float beta,
float *C,
int ldc);
718 void QUARK_CORE_ssygst(Quark *quark, Quark_Task_Flags *task_flags,
719 int itype, PLASMA_enum uplo,
int N,
724 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
725 PLASMA_enum uplo, PLASMA_enum trans,
726 int n,
int k,
int nb,
727 float alpha,
const float *A,
int lda,
728 float beta,
float *C,
int ldc);
729 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
730 PLASMA_enum uplo, PLASMA_enum trans,
731 int n,
int k,
int nb,
732 float alpha,
const float *A,
int lda,
733 const float *B,
int LDB,
734 float beta,
float *C,
int ldc);
735 void QUARK_CORE_ssyrfb(Quark *quark, Quark_Task_Flags *task_flags,
737 int n,
int k,
int ib,
int nb,
738 const float *A,
int lda,
739 const float *T,
int ldt,
741 void QUARK_CORE_shessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
742 PLASMA_enum uplo,
int n,
const float *A,
int lda,
743 float *scale,
float *sumsq,
744 float *fake,
int szeF,
int paramF );
745 void QUARK_CORE_slacpy(Quark *quark, Quark_Task_Flags *task_flags,
746 PLASMA_enum uplo,
int m,
int n,
int mb,
747 const float *A,
int lda,
749 void QUARK_CORE_slacpy_f1(Quark *quark, Quark_Task_Flags *task_flags,
750 PLASMA_enum uplo,
int m,
int n,
int nb,
751 const float *A,
int lda,
753 float *fake1,
int szefake1,
int flag1);
754 void QUARK_CORE_slacpy_pivot(Quark *quark, Quark_Task_Flags *task_flags,
757 int k1,
int k2,
const int *ipiv,
758 int *rankin,
int *rankout,
761 void QUARK_CORE_slange(Quark *quark, Quark_Task_Flags *task_flags,
762 int norm,
int M,
int N,
763 const float *A,
int LDA,
int szeA,
764 int szeW,
float *result);
765 void QUARK_CORE_slange_f1(Quark *quark, Quark_Task_Flags *task_flags,
766 int norm,
int M,
int N,
767 const float *A,
int LDA,
int szeA,
768 int szeW,
float *result,
769 float *fake,
int szeF);
771 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
772 int norm, PLASMA_enum uplo,
int N,
773 const float *A,
int LDA,
int szeA,
774 int szeW,
float *result);
775 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
776 int norm, PLASMA_enum uplo,
int N,
777 const float *A,
int LDA,
int szeA,
778 int szeW,
float *result,
779 float *fake,
int szeF);
781 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
782 int norm, PLASMA_enum uplo,
int N,
783 const float *A,
int LDA,
int szeA,
784 int szeW,
float *result);
785 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
786 int norm, PLASMA_enum uplo,
int N,
787 const float *A,
int LDA,
int szeA,
788 int szeW,
float *result,
789 float *fake,
int szeF);
790 void QUARK_CORE_slantr(Quark *quark, Quark_Task_Flags *task_flags,
791 PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
int M,
int N,
792 const float *A,
int LDA,
int szeA,
793 int szeW,
float *result);
794 void QUARK_CORE_slantr_f1(Quark *quark, Quark_Task_Flags *task_flags,
795 PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
int M,
int N,
796 const float *A,
int LDA,
int szeA,
797 int szeW,
float *result,
798 float *fake,
int szeF);
799 void QUARK_CORE_slascal(Quark *quark, Quark_Task_Flags *task_flags,
800 PLASMA_enum uplo,
int m,
int n,
int nb,
801 float alpha,
float *A,
int lda);
802 void QUARK_CORE_slaset(Quark *quark, Quark_Task_Flags *task_flags,
803 PLASMA_enum uplo,
int n1,
int n2,
float alpha,
804 float beta,
float *tileA,
int ldtilea);
805 void QUARK_CORE_slaset2(Quark *quark, Quark_Task_Flags *task_flags,
806 PLASMA_enum uplo,
int n1,
int n2,
float alpha,
807 float *tileA,
int ldtilea);
808 void QUARK_CORE_slaswp(Quark *quark, Quark_Task_Flags *task_flags,
809 int n,
float *A,
int lda,
810 int i1,
int i2,
const int *ipiv,
int inc);
811 void QUARK_CORE_slaswp_f2(Quark *quark, Quark_Task_Flags *task_flags,
812 int n,
float *A,
int lda,
813 int i1,
int i2,
const int *ipiv,
int inc,
814 float *fake1,
int szefake1,
int flag1,
815 float *fake2,
int szefake2,
int flag2);
816 void QUARK_CORE_slaswp_ontile(Quark *quark, Quark_Task_Flags *task_flags,
818 int i1,
int i2,
const int *ipiv,
int inc,
float *fakepanel);
819 void QUARK_CORE_slaswp_ontile_f2(Quark *quark, Quark_Task_Flags *task_flags,
821 int i1,
int i2,
const int *ipiv,
int inc,
822 float *fake1,
int szefake1,
int flag1,
823 float *fake2,
int szefake2,
int flag2);
824 void QUARK_CORE_slaswpc_ontile(Quark *quark, Quark_Task_Flags *task_flags,
826 int i1,
int i2,
const int *ipiv,
int inc,
float *fakepanel);
827 void QUARK_CORE_slatro(Quark *quark, Quark_Task_Flags *task_flags,
828 PLASMA_enum uplo, PLASMA_enum trans,
int m,
int n,
int mb,
829 const float *A,
int lda,
831 void QUARK_CORE_slatro_f1(Quark *quark, Quark_Task_Flags *task_flags,
832 PLASMA_enum uplo, PLASMA_enum trans,
int m,
int n,
int mb,
833 const float *A,
int lda,
835 float *fake1,
int szefake1,
int flag1);
836 void QUARK_CORE_slauum(Quark *quark, Quark_Task_Flags *task_flags,
837 PLASMA_enum uplo,
int n,
int nb,
839 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
840 float bump,
int m,
int n,
float *A,
int lda,
841 int bigM,
int m0,
int n0,
unsigned long long int seed );
842 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
843 float bump,
int m,
int n,
float *A,
int lda,
844 int bigM,
int m0,
int n0,
unsigned long long int seed );
845 void QUARK_CORE_splrnt(Quark *quark, Quark_Task_Flags *task_flags,
846 int m,
int n,
float *A,
int lda,
847 int bigM,
int m0,
int n0,
unsigned long long int seed );
848 void QUARK_CORE_spltmg(Quark *quark, Quark_Task_Flags *task_flags,
849 PLASMA_enum mtxtype,
int m,
int n,
float *A,
int lda,
850 int gM,
int gN,
int m0,
int n0,
unsigned long long int seed );
851 void QUARK_CORE_spltmg_chebvand( Quark *quark, Quark_Task_Flags *task_flags,
852 int M,
int N,
float *A,
int LDA,
853 int gN,
int m0,
int n0,
855 void QUARK_CORE_spltmg_circul( Quark *quark, Quark_Task_Flags *task_flags,
856 int M,
int N,
float *A,
int LDA,
857 int gM,
int m0,
int n0,
859 void QUARK_CORE_spltmg_fiedler(Quark *quark, Quark_Task_Flags *task_flags,
861 const float *X,
int incX,
862 const float *Y,
int incY,
864 void QUARK_CORE_spltmg_hankel( Quark *quark, Quark_Task_Flags *task_flags,
865 PLASMA_enum uplo,
int M,
int N,
float *A,
int LDA,
866 int m0,
int n0,
int nb,
869 void QUARK_CORE_spltmg_toeppd1(Quark *quark, Quark_Task_Flags *task_flags,
870 int gM,
int m0,
int M,
872 unsigned long long int seed);
873 void QUARK_CORE_spltmg_toeppd2(Quark *quark, Quark_Task_Flags *task_flags,
874 int M,
int N,
int K,
int m0,
int n0,
877 void QUARK_CORE_spotrf(Quark *quark, Quark_Task_Flags *task_flags,
878 PLASMA_enum uplo,
int n,
int nb,
882 void QUARK_CORE_ssetvar(Quark *quark, Quark_Task_Flags *task_flags,
883 const float *alpha,
float *x,
885 void QUARK_CORE_sshift( Quark *quark, Quark_Task_Flags *task_flags,
886 int s,
int m,
int n,
int L,
888 void QUARK_CORE_sshiftw(Quark *quark, Quark_Task_Flags *task_flags,
889 int s,
int cl,
int m,
int n,
int L,
891 void QUARK_CORE_sssssm(Quark *quark, Quark_Task_Flags *task_flags,
892 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
895 const float *L1,
int ldl1,
896 const float *L2,
int ldl2,
898 void QUARK_CORE_sstedc(Quark *quark, Quark_Task_Flags *task_flags,
899 PLASMA_enum compz,
int n,
902 void QUARK_CORE_sstedc_f2(Quark *quark, Quark_Task_Flags *task_flags,
903 PLASMA_enum compz,
int n,
906 void *fake1,
int szefake1,
int flag1,
907 void *fake2,
int szefake2,
int flag2);
908 void QUARK_CORE_ssteqr(Quark *quark, Quark_Task_Flags *task_flags,
909 PLASMA_enum compz,
int n,
912 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
913 PLASMA_enum side, PLASMA_enum uplo,
914 int m,
int n,
int nb,
915 float alpha,
const float *A,
int lda,
916 const float *B,
int ldb,
917 float beta,
float *C,
int ldc);
918 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
919 PLASMA_enum uplo, PLASMA_enum trans,
920 int n,
int k,
int nb,
921 float alpha,
const float *A,
int lda,
922 float beta,
float *C,
int ldc);
923 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
924 PLASMA_enum uplo, PLASMA_enum trans,
925 int n,
int k,
int nb,
926 float alpha,
const float *A,
int lda,
927 const float *B,
int LDB,
928 float beta,
float *C,
int ldc);
929 void QUARK_CORE_ssyssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
930 PLASMA_enum uplo,
int n,
const float *A,
int lda,
931 float *scale,
float *sumsq,
932 float *fake,
int szeF,
int paramF );
933 void QUARK_CORE_sswpab(Quark *quark, Quark_Task_Flags *task_flags,
934 int i,
int n1,
int n2,
936 void QUARK_CORE_sswptr_ontile(Quark *quark, Quark_Task_Flags *task_flags,
938 int i1,
int i2,
const int *ipiv,
int inc,
939 const float *Akk,
int ldak);
940 void QUARK_CORE_stradd(Quark *quark, Quark_Task_Flags *task_flags,
941 PLASMA_enum uplo, PLASMA_enum trans,
int m,
int n,
int nb,
943 const float *A,
int lda,
946 void QUARK_CORE_strasm(Quark *quark, Quark_Task_Flags *task_flags,
947 PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
int m,
int n,
948 const float *A,
int lda,
int szeA,
949 float *work,
int szeW);
950 void QUARK_CORE_strasm_f1(Quark *quark, Quark_Task_Flags *task_flags,
951 PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
int m,
int n,
952 const float *A,
int lda,
int szeA,
953 float *work,
int szeW,
954 float *fake,
int szeF);
955 void QUARK_CORE_strdalg1(Quark *quark, Quark_Task_Flags *task_flags,
962 int Vblksiz,
int wantz,
963 int i,
int sweepid,
int m,
int grsiz,
964 int *PCOL,
int *ACOL,
int *MCOL);
965 void QUARK_CORE_strmm(Quark *quark, Quark_Task_Flags *task_flags,
966 PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
967 int m,
int n,
int nb,
968 float alpha,
const float *A,
int lda,
970 void QUARK_CORE_strmm_p2(Quark *quark, Quark_Task_Flags *task_flags,
971 PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
972 int m,
int n,
int nb,
973 float alpha,
const float *A,
int lda,
975 void QUARK_CORE_strsm(Quark *quark, Quark_Task_Flags *task_flags,
976 PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
977 int m,
int n,
int nb,
978 float alpha,
const float *A,
int lda,
980 void QUARK_CORE_strssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
981 PLASMA_enum uplo, PLASMA_enum diag,
982 int m,
int n,
const float *A,
int lda,
983 float *scale,
float *sumsq,
984 float *fake,
int szeF,
int paramF );
985 void QUARK_CORE_strtri(Quark *quark, Quark_Task_Flags *task_flags,
986 PLASMA_enum uplo, PLASMA_enum diag,
int n,
int nb,
990 void QUARK_CORE_stslqt(Quark *quark, Quark_Task_Flags *task_flags,
991 int m,
int n,
int ib,
int nb,
995 void QUARK_CORE_stsmlq(Quark *quark, Quark_Task_Flags *task_flags,
996 PLASMA_enum side, PLASMA_enum trans,
997 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1000 const float *V,
int ldv,
1001 const float *T,
int ldt);
1002 void QUARK_CORE_stsmlq_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
1003 PLASMA_enum side, PLASMA_enum trans,
1004 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1005 float *A1,
int lda1,
1006 float *A2,
int lda2,
1007 const float *V,
int ldv,
1008 const float *T,
int ldt);
1009 void QUARK_CORE_stsmlq_corner(Quark *quark, Quark_Task_Flags *task_flags,
1010 int m1,
int n1,
int m2,
int n2,
int m3,
int n3,
int k,
int ib,
int nb,
1011 float *A1,
int lda1,
1012 float *A2,
int lda2,
1013 float *A3,
int lda3,
1014 const float *V,
int ldv,
1015 const float *T,
int ldt);
1016 void QUARK_CORE_stsmqr(Quark *quark, Quark_Task_Flags *task_flags,
1017 PLASMA_enum side, PLASMA_enum trans,
1018 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1019 float *A1,
int lda1,
1020 float *A2,
int lda2,
1021 const float *V,
int ldv,
1022 const float *T,
int ldt);
1023 void QUARK_CORE_stsmqr_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
1024 PLASMA_enum side, PLASMA_enum trans,
1025 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1026 float *A1,
int lda1,
1027 float *A2,
int lda2,
1028 const float *V,
int ldv,
1029 const float *T,
int ldt);
1030 void QUARK_CORE_stsmqr_corner(Quark *quark, Quark_Task_Flags *task_flags,
1031 int m1,
int n1,
int m2,
int n2,
int m3,
int n3,
int k,
int ib,
int nb,
1032 float *A1,
int lda1,
1033 float *A2,
int lda2,
1034 float *A3,
int lda3,
1035 const float *V,
int ldv,
1036 const float *T,
int ldt);
1037 void QUARK_CORE_stsqrt(Quark *quark, Quark_Task_Flags *task_flags,
1038 int m,
int n,
int ib,
int nb,
1039 float *A1,
int lda1,
1040 float *A2,
int lda2,
1042 void QUARK_CORE_ststrf(Quark *quark, Quark_Task_Flags *task_flags,
1043 int m,
int n,
int ib,
int nb,
1049 PLASMA_bool check_info,
int iinfo);
1050 void QUARK_CORE_sttmqr(Quark *quark, Quark_Task_Flags *task_flags,
1051 PLASMA_enum side, PLASMA_enum trans,
1052 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1053 float *A1,
int lda1,
1054 float *A2,
int lda2,
1055 const float *V,
int ldv,
1056 const float *T,
int ldt);
1057 void QUARK_CORE_sttqrt(Quark *quark, Quark_Task_Flags *task_flags,
1058 int m,
int n,
int ib,
int nb,
1059 float *A1,
int lda1,
1060 float *A2,
int lda2,
1062 void QUARK_CORE_sttmlq(Quark *quark, Quark_Task_Flags *task_flags,
1063 PLASMA_enum side, PLASMA_enum trans,
1064 int m1,
int n1,
int m2,
int n2,
int k,
int ib,
int nb,
1065 float *A1,
int lda1,
1066 float *A2,
int lda2,
1067 const float *V,
int ldv,
1068 const float *T,
int ldt);
1069 void QUARK_CORE_sttlqt(Quark *quark, Quark_Task_Flags *task_flags,
1070 int m,
int n,
int ib,
int nb,
1071 float *A1,
int lda1,
1072 float *A2,
int lda2,
1074 void QUARK_CORE_spamm(Quark *quark, Quark_Task_Flags *task_flags,
1075 int op, PLASMA_enum side, PLASMA_enum storev,
1076 int m,
int n,
int k,
int l,
1077 const float *A1,
int lda1,
1078 float *A2,
int lda2,
1079 const float *V,
int ldv,
1081 void QUARK_CORE_splssq( Quark *quark, Quark_Task_Flags *task_flags,
1082 int m,
const float *A,
float *result );
1083 void QUARK_CORE_sormlq(Quark *quark, Quark_Task_Flags *task_flags,
1084 PLASMA_enum side, PLASMA_enum trans,
1085 int m,
int n,
int ib,
int nb,
int k,
1086 const float *A,
int lda,
1087 const float *T,
int ldt,
1089 void QUARK_CORE_sormqr(Quark *quark, Quark_Task_Flags *task_flags,
1090 PLASMA_enum side, PLASMA_enum trans,
1091 int m,
int n,
int k,
int ib,
int nb,
1092 const float *A,
int lda,
1093 const float *T,
int ldt,
1097 void QUARK_CORE_slascl(Quark *quark, Quark_Task_Flags *task_flags,
1098 PLASMA_enum type,
int kl,
int ku,
float cfrom,
float cto,
1099 int m,
int n,
float *A,
int lda);
1100 void QUARK_CORE_slascl_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1101 PLASMA_enum type,
int kl,
int ku,
float *cfrom,
float *cto,
1102 int m,
int n,
float *A,
int lda,
1103 void *fake,
int szefake,
int flag);
1104 void QUARK_CORE_slaed0_lascl( Quark *quark, Quark_Task_Flags *task_flags,
1105 int n,
float *scale,
float *D,
float *E);
1106 void QUARK_CORE_slaed0_betaapprox(Quark *quark, Quark_Task_Flags *task_flags,
1107 int subpbs,
const int *subpbs_info,
1108 float *D,
const float *E);
1111 void QUARK_CORE_slaed2_computeK(Quark *quark, Quark_Task_Flags *task_flags,
1112 int *K1,
int n,
int n1,
1113 float *beta,
float *D,
float *Q,
int LDQ,
1114 float *Z,
float *DLAMBDA,
float *W,
1115 int *INDX,
int *INDXC,
int *INDXP,
int *INDXQ,
1117 float **Qmerge,
int wsmode,
1120 void QUARK_CORE_slaed1_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1121 int n,
int n1,
const int *K,
1122 const int *INDX,
const int *ctot,
1123 float *D,
const float *beta,
1124 float *Q,
int LDQ,
float *Q2,
1125 const float *DLAMBDA,
const float *W,
float *Wred,
1126 int start,
int end);
1127 void QUARK_CORE_slaed2_compressq(Quark *quark, Quark_Task_Flags *task_flags,
1128 int n,
int n1,
int start,
int end,
1129 const int *INDX,
const int *ctot,
1130 const float *Q,
int LDQ,
1132 void QUARK_CORE_slaed4_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1133 int n,
const int *K,
1134 float *D,
const float *beta,
1135 float **Q,
const int *LDQ,
1136 const float *DLAMBDA,
const float *W,
const int *INDX,
1139 void *fakeQ,
int flagfQ);
1140 void QUARK_CORE_slaed3_compW_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1141 int n,
const int *K,
1142 float **Q,
const int *LDQ,
1143 const float *DLAMBDA,
float *W,
1146 void *fakeQ,
int flagfQ,
1147 void *fakeW,
int flagfW);
1149 void QUARK_CORE_slaed3_reduceW(Quark *quark, Quark_Task_Flags *task_flags,
1150 int n,
int n1,
const int *K,
int l,
1151 const float *Q,
int LDQ,
1152 const float *Wred,
float *W);
1153 void QUARK_CORE_slaed3_reduceW_p2(Quark *quark, Quark_Task_Flags *task_flags,
1154 int n,
int n1,
const int *K,
int l,
1155 float **Q,
const int *LDQ,
1156 const float *Wred,
float *W);
/*
 * Prototype for QUARK_CORE_slaed2_copydef (returns void).
 * The parameters after the Quark arguments follow the CORE_slaed2_copydef
 * kernel listed in the cross-reference section, except that K is passed as
 * "const int *" here and as a plain int to the kernel. Q is the only
 * non-const array; Q2 and ctot are pointers to const.
 */
1158 void QUARK_CORE_slaed2_copydef(Quark *quark, Quark_Task_Flags *task_flags,
1159 int n,
int n1,
const int *K,
const int *ctot,
1160 float *Q,
int LDQ,
const float *Q2,
1161 int start,
int end);
/*
 * Prototype for QUARK_CORE_slaed3_computevectors (returns void).
 * Compared with the CORE_slaed3_computevectors kernel in the cross-reference
 * section, this wrapper adds wsmode and n, passes K / il_nondef / iu_nondef as
 * pointers to const int instead of by value, and replaces the kernel's single
 * "float *S" workspace argument with two "float **" arguments (WSglobal,
 * WSlocal).
 * NOTE(review): how wsmode selects between WSglobal and WSlocal is not
 * visible here -- confirm against the implementation.
 */
1162 void QUARK_CORE_slaed3_computevectors(Quark *quark, Quark_Task_Flags *task_flags,
1163 int wsmode,
int n,
const int *K,
1164 const int *il_nondef,
const int *iu_nondef,
1165 float *Q,
int LDQ,
float *W,
const int *INDXC,
1166 float **WSglobal,
float **WSlocal,
1167 int start,
int end );
/*
 * Prototype for QUARK_CORE_slaed3_wscopy (returns void).
 * K, il_nondef, iu_nondef and Q are pointers to const; WORK is a "float **";
 * LDQ, start and end are passed by value.
 * NOTE(review): the name and const-ness suggest a copy from Q into the
 * workspace referenced by WORK -- confirm against the implementation.
 */
1168 void QUARK_CORE_slaed3_wscopy( Quark *quark, Quark_Task_Flags *task_flags,
1169 const int *K,
const int *il_nondef,
const int *iu_nondef,
1170 const float *Q,
int LDQ,
float **WORK,
1171 int start,
int end );
/*
 * Prototype for QUARK_CORE_slaed3_updatevectors (returns void).
 * Compared with the CORE_slaed3_updatevectors kernel in the cross-reference
 * section: K / il_nondef / iu_nondef are non-const "int *" here (plain int in
 * the kernel), WORK is "float **" (float * in the kernel), and this wrapper
 * additionally takes D, INDXQ, COLTYP and WORKDEP, where the kernel takes a
 * "const int *ctot".
 * NOTE(review): WORKDEP is presumably a dependency handle rather than data;
 * confirm against the implementation.
 */
1172 void QUARK_CORE_slaed3_updatevectors(Quark *quark, Quark_Task_Flags *task_flags,
1173 int oper,
int wsmode,
int n,
int n1,
int *K,
1174 int *il_nondef,
int *iu_nondef,
1175 float *D,
float *Q,
int LDQ,
float *Q2,
1176 int *INDXQ,
int *COLTYP,
float **WORK,
1177 int start,
int end,
float **WORKDEP);
/*
 * Prototype for QUARK_CORE_slaed3_pipelined (returns void).
 * All pointer parameters are non-const: K, il_nondef, iu_nondef, INDXC,
 * INDXQ, COLTYP (int *) and D, Q, Q2, W (float *). n, n1, LDQ, start and end2
 * are passed by value.
 * Note that the last parameter is named end2, not end as in the sibling
 * prototypes.
 */
1178 void QUARK_CORE_slaed3_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1179 int n,
int n1,
int *K,
int *il_nondef,
int *iu_nondef,
1180 float *D,
float *Q,
int LDQ,
float *Q2,
1181 int *INDXC,
int *INDXQ,
int *COLTYP,
float *W,
1182 int start,
int end2);
/*
 * Prototype for QUARK_CORE_sDC_fakedep (returns void): takes the Quark handle,
 * the task flags, two ints (nb_tasks, nb), a float matrix pointer Q with its
 * leading dimension LDQ, and a float pointer W.
 * NOTE(review): the name suggests a task inserted only to express
 * dependencies between divide-and-conquer tasks -- confirm against the
 * implementation.
 */
1184 void QUARK_CORE_sDC_fakedep(Quark *quark, Quark_Task_Flags *task_flags,
1185 int nb_tasks,
int nb,
float *Q,
int LDQ,
float *W);
/*
 * Prototype for QUARK_CORE_sswap (returns void).
 * Parameter order follows the CORE_sswap kernel listed in the cross-reference
 * section, with two visible differences: work and perm are non-const pointers
 * here (const in the kernel), and the range start is named begin here (start
 * in the kernel).
 */
1188 void QUARK_CORE_sswap(Quark *quark, Quark_Task_Flags *task_flags,
1189 int m,
int n,
float *Q,
1190 int LDQ,
float *work,
1191 int *perm,
int begin,
int end);
/*
 * Prototype for QUARK_CORE_slag2c.
 * NOTE(review): this declaration is incomplete as shown. Listing numbers 1194
 * and 1196-1197 are absent and the parameter list stops at "int LDQ," with no
 * closing ");". The CORE_slag2c kernel in the cross-reference section takes
 * (m, n, R, ldr, Z, ldz) with Z of type PLASMA_Complex32_t *, so size and
 * output parameters are presumably on the missing lines -- restore them from
 * the original header.
 */
1193 void QUARK_CORE_slag2c(Quark *quark, Quark_Task_Flags *task_flags,
1195 const float *Q,
int LDQ,
/*
 * Prototype for QUARK_CORE_slaed3_freebigwork (returns void): takes the Quark
 * handle, the task flags, an int pointer K_bis, an int largework and a
 * "float **" WORK.
 * NOTE(review): the name suggests it releases the workspace referenced by
 * WORK; ownership and the role of K_bis / largework are not visible here --
 * confirm against the implementation.
 */
1198 void QUARK_CORE_slaed3_freebigwork(Quark *quark, Quark_Task_Flags *task_flags,
1199 int *K_bis,
int largework,
float **WORK);
/*
 * Prototype for QUARK_CORE_slaset_identity.
 * NOTE(review): this declaration is incomplete as shown. The parameter list
 * stops at "int size," with no closing ");", and the embedded listing numbers
 * jump from 1201 to 1207 -- restore the remaining parameters from the
 * original header.
 */
1200 void QUARK_CORE_slaset_identity(Quark *quark, Quark_Task_Flags *task_flags,
1201 int n,
int start,
int size,
/*
 * Prototypes of the CORE_*_quark functions. Every one has the same shape:
 * it returns void and receives only the Quark handle.
 * NOTE(review): these are presumably the task bodies that unpack their
 * arguments from the Quark handle and call the matching CORE_* kernel --
 * confirm against the implementations.
 *
 * Several names are declared more than once in this run (CORE_slatro_quark,
 * CORE_slansy_quark, CORE_slansy_f1_quark, CORE_splgsy_quark,
 * CORE_ssymm_quark, CORE_ssyrk_quark, CORE_ssyr2k_quark). The repeated
 * declarations are identical, which C permits.
 * NOTE(review): listing numbers 1234, 1238, 1250 and 1253 are absent, so
 * preprocessor guards around some of the repeated names may have been lost
 * from this listing -- check the original header before de-duplicating.
 */
1207 void CORE_sasum_quark(Quark *quark);
1208 void CORE_sasum_f1_quark(Quark *quark);
1209 void CORE_sgeadd_quark(Quark *quark);
1210 void CORE_sbrdalg1_quark(Quark *quark);
1211 void CORE_sgelqt_quark(Quark *quark);
1212 void CORE_sgemm_quark(Quark *quark);
1213 void CORE_sgemm_tile_quark(Quark *quark);
1214 void CORE_sgemv_quark(Quark *quark);
1215 void CORE_sgemv_tile_quark(Quark *quark);
1216 void CORE_sgeqp3_init_quark(Quark *quark);
1217 void CORE_sgeqp3_larfg_quark(Quark *quark);
1218 void CORE_sgeqp3_norms_quark(Quark *quark);
1219 void CORE_sgeqp3_pivot_quark(Quark *quark);
1220 void CORE_sgeqp3_tntpiv_quark(Quark *quark);
1221 void CORE_sgeqp3_update_quark(Quark *quark);
1222 void CORE_sgeqrt_quark(Quark *quark);
1223 void CORE_sgessm_quark(Quark *quark);
1224 void CORE_sgessq_quark(Quark *quark);
1225 void CORE_sgessq_f1_quark(Quark *quark);
1226 void CORE_sgetrf_quark(Quark *quark);
1227 void CORE_sgetrf_incpiv_quark(Quark *quark);
1228 void CORE_sgetrf_nopiv_quark(Quark* quark);
1229 void CORE_sgetrf_reclap_quark(Quark *quark);
1230 void CORE_sgetrf_rectil_quark(Quark* quark);
1231 void CORE_sgetrip_quark(Quark *quark);
1232 void CORE_sgetrip_f1_quark(Quark *quark);
1233 void CORE_sgetrip_f2_quark(Quark *quark);
/* First declaration of ssymm/ssyrk/ssyr2k; repeated further down (listing 1271-1273). */
1235 void CORE_ssymm_quark(Quark *quark);
1236 void CORE_ssyrk_quark(Quark *quark);
1237 void CORE_ssyr2k_quark(Quark *quark);
1239 void CORE_ssygst_quark(Quark *quark);
1240 void CORE_ssyrfb_quark(Quark *quark);
1241 void CORE_shessq_quark(Quark *quark);
1242 void CORE_shessq_f1_quark(Quark *quark);
1243 void CORE_slacpy_quark(Quark *quark);
1244 void CORE_slacpy_f1_quark(Quark *quark);
1245 void CORE_slacpy_pivot_quark(Quark *quark);
1246 void CORE_slatro_quark(Quark *quark);
1247 void CORE_slatro_f1_quark(Quark *quark);
1248 void CORE_slange_quark(Quark *quark);
1249 void CORE_slange_f1_quark(Quark *quark);
/* CORE_slansy_quark / CORE_slansy_f1_quark appear twice in a row below. */
1251 void CORE_slansy_quark(Quark *quark);
1252 void CORE_slansy_f1_quark(Quark *quark);
1254 void CORE_slansy_quark(Quark *quark);
1255 void CORE_slansy_f1_quark(Quark *quark);
1256 void CORE_slaset_quark(Quark *quark);
1257 void CORE_slaset2_quark(Quark *quark);
1258 void CORE_slatro_quark(Quark *quark);
1259 void CORE_slauum_quark(Quark *quark);
1260 void CORE_spamm_quark(Quark *quark);
/* CORE_splgsy_quark is declared on two consecutive lines. */
1261 void CORE_splgsy_quark(Quark *quark);
1262 void CORE_splgsy_quark(Quark *quark);
1263 void CORE_splrnt_quark(Quark *quark);
1264 void CORE_spltmg_quark(Quark *quark);
1265 void CORE_splssq_quark(Quark *quark);
1266 void CORE_spotrf_quark(Quark *quark);
1267 void CORE_ssetvar_quark(Quark *quark);
1268 void CORE_sshift_quark(Quark *quark);
1269 void CORE_sshiftw_quark(Quark *quark);
1270 void CORE_sssssm_quark(Quark *quark);
/* Second declaration of ssymm/ssyrk/ssyr2k (first at listing 1235-1237). */
1271 void CORE_ssymm_quark(Quark *quark);
1272 void CORE_ssyrk_quark(Quark *quark);
1273 void CORE_ssyr2k_quark(Quark *quark);
1274 void CORE_ssyssq_quark(Quark *quark);
1275 void CORE_ssyssq_f1_quark(Quark *quark);
1276 void CORE_sswpab_quark(Quark *quark);
1277 void CORE_sswptr_ontile_quark(Quark *quark);
1278 void CORE_strdalg1_quark(Quark *quark);
1279 void CORE_strmm_quark(Quark *quark);
1280 void CORE_strsm_quark(Quark *quark);
1281 void CORE_strtri_quark(Quark *quark);
1282 void CORE_stslqt_quark(Quark *quark);
1283 void CORE_stsmlq_quark(Quark *quark);
1284 void CORE_stsmlq_sytra1_quark(Quark *quark);
1285 void CORE_stsmlq_corner_quark(Quark *quark);
1286 void CORE_stsmqr_quark(Quark *quark);
1287 void CORE_stsmqr_sytra1_quark(Quark *quark);
1288 void CORE_stsmqr_corner_quark(Quark *quark);
1289 void CORE_stsqrt_quark(Quark *quark);
1290 void CORE_ststrf_quark(Quark *quark);
1291 void CORE_sttmqr_quark(Quark *quark);
1292 void CORE_sttqrt_quark(Quark *quark);
1293 void CORE_sttmlq_quark(Quark *quark);
1294 void CORE_sttlqt_quark(Quark *quark);
1295 void CORE_sormlq_quark(Quark *quark);
1296 void CORE_sormqr_quark(Quark *quark);
1297 void CORE_slaswp_quark(Quark* quark);
1298 void CORE_slaswp_f2_quark(Quark* quark);
1299 void CORE_slaswp_ontile_quark(Quark *quark);
1300 void CORE_slaswp_ontile_f2_quark(Quark *quark);
1301 void CORE_slaswpc_ontile_quark(Quark *quark);
1302 void CORE_strmm_p2_quark(Quark* quark);
1303 void CORE_sgemm_f2_quark(Quark* quark);
1304 void CORE_sgemm_p2_quark(Quark* quark);
1305 void CORE_sgemm_p2f1_quark(Quark* quark);
1306 void CORE_sgemm_p3_quark(Quark* quark);
void CORE_slaed0_betaapprox(int subpbs, const int *subpbs_info, float *D, const float *E)
Definition: core_slaed0_betaapprox.c:49
int CORE_sttqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttqrt.c:116
int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmlq.c:124
int CORE_sgetf2_nopiv(int m, int n, float *A, int lda)
Definition: core_sgetf2_nopiv.c:64
void CORE_spotrf(PLASMA_enum uplo, int N, float *A, int LDA, int *INFO)
Definition: core_spotrf.c:68
int CORE_slarfx2c(PLASMA_enum uplo, float V, float TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:177
void CORE_slaed3_computeW(int n, int K, const float *Q, int LDQ, const float *DLAMBDA, float *W, const int *INDX, int start, int end)
Definition: core_slaed3_computeW.c:66
int CORE_sswptr_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc, const float *Akk, int ldak)
Definition: core_slaswp.c:224
void CORE_sgbtype1cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype1cb.c:124
void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strsm.c:80
int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmlq.c:116
int CORE_spltmg_chebvand(int M, int N, float *A, int LDA, int gN, int m0, int n0, float *W)
Definition: core_spltmg_chebvand.c:83
int CORE_spamm(int op, PLASMA_enum side, PLASMA_enum storev, int M, int N, int K, int L, const float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, float *W, int LDW)
Definition: core_spamm.c:175
void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, float beta, float *C, int LDC)
Definition: core_ssyrk.c:80
void CORE_ssbtype2cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype2cb.c:104
void CORE_sgeqp3_larfg(PLASMA_desc A, int ii, int jj, int i, int j, float *tau, float *beta)
Definition: core_sgeqp3_larfg.c:78
int CORE_shbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbrce.c:78
void CORE_sswap(int m, int n, float *Q, int ldq, const float *work, const int *perm, int start, int end)
Definition: core_sswap.c:67
void CORE_slaed2_copydef(int n, int n1, int K, const int *ctot, float *Q, int LDQ, const float *Q2, int start, int end)
Definition: core_slaed2_compressq.c:180
void CORE_slaed3_merge(int n, int K, float *D, int *INDXQ)
Definition: core_slaed3_merge.c:46
int CORE_spltmg(PLASMA_enum mtxtype, int m, int n, float *A, int lda, int gM, int gN, int m0, int n0, unsigned long long int seed)
Definition: core_spltmg.c:90
int CORE_slaswp_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:107
void CORE_slaset(PLASMA_enum uplo, int n1, int n2, float alpha, float beta, float *tileA, int ldtilea)
Definition: core_slaset.c:57
int CORE_ssyrfb(PLASMA_enum uplo, int N, int K, int IB, int NB, const float *A, int LDA, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_ssyrfb.c:110
int CORE_sgessm(int M, int N, int K, int IB, const int *IPIV, const float *L, int LDL, float *A, int LDA)
Definition: core_sgessm.c:70
int CORE_shblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shblrx.c:78
int CORE_slarfx2(PLASMA_enum side, int N, float V, float TAU, float *C1, int LDC1, float *C2, int LDC2)
Definition: core_slarfx_tbrd.c:82
void CORE_sgeqp3_pivot(PLASMA_desc A, float *F, int ldf, int jj, int k, int *jpvt, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_pivot.c:68
void CORE_sshiftw(int s, int cl, int m, int n, int L, float *A, float *W)
Definition: core_sshift.c:66
void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int lda, float *work)
Definition: core_strasm.c:66
void CORE_spltmg_condexq(int M, int N, float *Q, int LDQ)
Definition: core_spltmg_condex.c:53
void CORE_sgeqp3_update(const float *Ajj, int lda1, float *Ajk, int lda2, const float *Fk, int ldf, int joff, int k, int koff, int nb, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_update.c:82
int CORE_slag2c(int m, int n, const float *R, int ldr, PLASMA_Complex32_t *Z, int ldz)
Definition: core_slag2c.c:58
void CORE_slaed2_compressq(int n, int n1, const int *INDX, const int *ctot, const float *Q, int LDQ, float *Q2, int start, int end)
Definition: core_slaed2_compressq.c:85
void CORE_sgeqp3_norms(PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2)
Definition: core_sgeqp3_norms.c:62
void CORE_ssygst(int itype, PLASMA_enum uplo, int N, float *A, int LDA, float *B, int LDB, int *INFO)
Definition: core_ssygst.c:80
int CORE_sgetrf_reclap(CORE_sgetrf_data_t *data, int M, int N, float *A, int LDA, int *IPIV, int *info)
Definition: core_sgetrf_reclap.c:123
void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strmm.c:84
void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slantr.c:86
int CORE_sgetrf_incpiv(int M, int N, int IB, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf_incpiv.c:83
int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmqr.c:124
int CORE_sgetrf_rectil(CORE_sgetrf_data_t *data, const PLASMA_desc A, int *IPIV, int *info)
Definition: core_sgetrf_rectil.c:120
void CORE_sbrdalg1(PLASMA_enum uplo, int n, int nb, float *A, int lda, float *VQ, float *TAUQ, float *VP, float *TAUP, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_sbrdalg1.c:111
int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M1, int N1, int M2, int N2, int K, int L, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sparfb.c:132
void CORE_slaed3_updatevectors(int op, int wsmode, int n, int n1, int K, int il_nondef, int iu_nondef, float *Q, int ldq, float *Q2, const int *ctot, float *WORK, int start, int end)
Definition: core_slaed3_updatevectors.c:95
int CORE_stsmqr_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_corner.c:130
int CORE_stradd(PLASMA_enum uplo, PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, float beta, float *B, int LDB)
Definition: core_stradd.c:86
int CORE_sgbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbrce.c:78
int CORE_stsmlq_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_corner.c:130
void CORE_ssbtype1cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype1cb.c:100
int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmqr.c:116
int CORE_sgeqrt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgeqrt.c:86
void CORE_splrnt(int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splrnt.c:68
void CORE_slauum(PLASMA_enum uplo, int N, float *A, int LDA)
Definition: core_slauum.c:57
void CORE_ssbtype3cb(int N, int NB, float *A, int LDA, const float *V, const float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype3cb.c:101
void CORE_slange(int norm, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slange.c:72
int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slatro.c:80
void CORE_strdalg1(int n, int nb, float *A, int lda, float *V, float *TAU, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_strdalg1.c:91
Definition: core_sgetrf_reclap.c:24
int CORE_slarfx2ce(PLASMA_enum uplo, float *V, float *TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:323
int CORE_sgbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbelr.c:81
int CORE_stsmqr_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_sytra1.c:127
int CORE_slacpy_pivot(const PLASMA_desc descA, PLASMA_enum direct, int k1, int k2, const int *ipiv, int *rankin, int *rankout, float *A, int lda, int init)
Definition: core_slacpy_pivot.c:84
int CORE_spltmg_hankel(PLASMA_enum uplo, int M, int N, float *A, int LDA, int m0, int n0, int nb, const float *V1, const float *V2)
Definition: core_spltmg_hankel.c:88
void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB, int M, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_sgemm.c:90
int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans, int M, int N, int K, int IB, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormqr.c:108
void CORE_slaset2(PLASMA_enum uplo, int n1, int n2, float alpha, float *tileA, int ldtilea)
Definition: core_slaset2.c:55
int CORE_stslqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stslqt.c:107
void CORE_slarfy(int N, float *A, int LDA, const float *V, const float *TAU, float *WORK)
Definition: core_slarfy.c:61
int CORE_sgetrf_nopiv(int m, int n, int ib, float *A, int lda)
Definition: core_sgetrf_nopiv.c:69
void CORE_slaed3_reduceW(int n, int n1, int K, int l, const float *Q, int LDQ, const float *Wred, float *W)
Definition: core_slaed3_reduceW.c:60
void CORE_slaed2_computeK(int *K, int n, int n1, float *beta, float *D, float *Q, int LDQ, float *Z, float *DLAMBDA, float *W, int *INDX, int *INDXC, int *INDXP, int *INDXQ, int *COLTYP)
Definition: core_slaed2_computeK.c:104
void CORE_sgetrip(int m, int n, float *A, float *work)
Definition: core_sgetrip.c:51
int CORE_shbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbelr.c:80
void CORE_spltmg_toeppd1(int gM, int m0, int M, float *W, unsigned long long int seed)
Definition: core_spltmg_toeppd.c:70
int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans, int M, int N, int IB, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormlq.c:108
int CORE_slascl(PLASMA_enum type, int kl, int ku, float cfrom, float cto, int m, int n, float *A, int lda)
Definition: core_slascl.c:77
int CORE_sttlqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttlqt.c:116
void CORE_splgsy(float bump, int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splgsy.c:72
void CORE_sgemv(PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, const float *x, int incx, float beta, float *y, int incy)
Definition: core_sgemv.c:78
int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M, int N, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_slarfb_gemm.c:113
void CORE_ssetvar(const float *alpha, float *x)
Definition: core_ssetvar.c:37
int CORE_stsmlq_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_sytra1.c:125
int CORE_slaswpc_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:296
int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev, int M, int N, int L, float ALPHA, const float *A, int LDA, const float *X, int INCX, float BETA, float *Y, int INCY, float *WORK)
Definition: core_spemv.c:118
int CORE_sgelqt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgelqt.c:85
void CORE_sgbtype2cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype2cb.c:129
int CORE_slaed4(int n, int K, float *D, float beta, float *Q, int LDQ, const float *D0, const float *Z, const int *INDX, int start, int end)
Definition: core_slaed4.c:75
int CORE_sstedc(PLASMA_enum compz, int n, float *D, float *E, float *Z, int LDZ, float *WORK, int LWORK, int *IWORK, int LIWORK)
Definition: core_sstedc.c:85
void CORE_slaswp(int N, float *A, int LDA, int I1, int I2, const int *IPIV, int INC)
Definition: core_slaswp.c:62
int CORE_stsqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stsqrt.c:97
void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag, int N, float *A, int LDA, int *info)
Definition: core_strtri.c:66
void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo, int M, int N, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssymm.c:88
void CORE_sasum(int storev, PLASMA_enum uplo, int M, int N, const float *A, int lda, float *work)
Definition: core_sasum.c:61
int CORE_sssssm(int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *L1, int LDL1, const float *L2, int LDL2, const int *IPIV)
Definition: core_sssssm.c:94
void CORE_slaed3_computevectors(int K, int il_nondef, int iu_nondef, float *Q, int LDQ, float *W, float *S, const int *INDXC, int start, int end)
Definition: core_slaed3_computevectors.c:74
void CORE_slacpy(PLASMA_enum uplo, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slacpy.c:59
Definition: descriptor.h:41
void CORE_spltmg_fiedler(int m, int n, const float *X, int incX, const float *Y, int incY, float *A, int lda)
Definition: core_spltmg_fiedler.c:75
void CORE_slansy(int norm, PLASMA_enum uplo, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slansy.c:74
void CORE_spltmg_toeppd2(int M, int N, int K, int m0, int n0, const float *W, float *A, int LDA)
Definition: core_spltmg_toeppd.c:149
int CORE_spltmg_circul(int M, int N, float *A, int LDA, int gM, int m0, int n0, const float *V)
Definition: core_spltmg_circul.c:76
int CORE_sgblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgblrx.c:80
void CORE_sswpab(int i, int n1, int n2, float *A, float *work)
Definition: core_sswpab.c:63
int CORE_slascal(PLASMA_enum uplo, int m, int n, float alpha, float *A, int lda)
Definition: core_slascal.c:52
int CORE_sgeadd(PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, float beta, float *B, int LDB)
Definition: core_sgeadd.c:75
int CORE_ststrf(int M, int N, int IB, int NB, float *U, int LDU, float *A, int LDA, float *L, int LDL, int *IPIV, float *WORK, int LDWORK, int *INFO)
Definition: core_ststrf.c:99
void CORE_sgeqp3_init(int n, int *jpvt)
Definition: core_sgeqp3_init.c:38
int CORE_ssteqr(PLASMA_enum compz, int n, float *D, float *E, float *Z, int LDZ, float *WORK)
Definition: core_ssteqr.c:66
void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssyr2k.c:90
void CORE_sgbtype3cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype3cb.c:124
int CORE_sgetrf(int M, int N, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf.c:60