PLASMA  2.8.0
PLASMA - Parallel Linear Algebra for Scalable Multi-core Architectures
core_sblas.h
1 
18 #ifndef _PLASMA_CORE_SBLAS_H_
19 #define _PLASMA_CORE_SBLAS_H_
20 
21 #define REAL
22 
23 #ifdef __cplusplus
24 extern "C" {
25 #endif
26 
/*
 * Handle type for the CORE_sgetrf_reclap / CORE_sgetrf_rectil kernels.
 * Only the struct tag is declared in this header, so the type is incomplete
 * here and can only be used through pointers: the *_init() functions return
 * a CORE_sgetrf_data_t pointer and the kernels take one as their first
 * argument.
 */
struct CORE_sgetrf_data_s;
typedef struct CORE_sgetrf_data_s CORE_sgetrf_data_t;
29 
/*
 * Kernel prototypes declared ahead of the QUARK_H-guarded wrappers:
 * CORE_sasum, CORE_sbrdalg1, CORE_sgbelr, CORE_sgbrce, CORE_sgblrx, CORE_sgeadd.
 */
/* CORE_sasum: A is const-qualified; `work` is the only writable pointer argument. */
33 void CORE_sasum(int storev, PLASMA_enum uplo, int M, int N,
34  const float *A, int lda, float *work);
/* CORE_sbrdalg1: returns void; all pointer arguments (A, VQ, TAUQ, VP, TAUP, work) are non-const. */
35 void CORE_sbrdalg1( PLASMA_enum uplo,
36  int n,
37  int nb,
38  float *A,
39  int lda,
40  float *VQ,
41  float *TAUQ,
42  float *VP,
43  float *TAUP,
44  int Vblksiz, int wantz,
45  int i, int sweepid, int m, int grsiz,
46  float *work);
/*
 * CORE_sgbelr, CORE_sgbrce, CORE_sgblrx: three prototypes with the same
 * parameter list. A is passed as a pointer to a PLASMA_desc. Each returns int
 * (presumably a status code - confirm in the implementation).
 */
47 int CORE_sgbelr(PLASMA_enum uplo, int N,
48  PLASMA_desc *A, float *V, float *TAU,
49  int st, int ed, int eltsize);
50 int CORE_sgbrce(PLASMA_enum uplo, int N,
51  PLASMA_desc *A, float *V, float *TAU,
52  int st, int ed, int eltsize);
53 int CORE_sgblrx(PLASMA_enum uplo, int N,
54  PLASMA_desc *A, float *V, float *TAU,
55  int st, int ed, int eltsize);
/*
 * CORE_sgeadd: A is const, B is writable; alpha and beta are passed by value.
 * NOTE(review): the argument layout suggests B = alpha*op(A) + beta*B - confirm.
 */
56 int CORE_sgeadd(PLASMA_enum trans, int M, int N,
57  float alpha,
58  const float *A, int LDA,
59  float beta,
60  float *B, int LDB);
/*
 * CORE_sgelqt, CORE_sgemm, CORE_sgemv.
 * CORE_sgelqt returns int and takes only writable buffers (A, T, TAU, WORK).
 * CORE_sgemm and CORE_sgemv return void and const-qualify every array operand
 * except the last one (C and y respectively).
 * NOTE(review): the names follow the LAPACK/BLAS GELQT / GEMM / GEMV
 * convention - confirm the exact semantics against the kernel sources.
 */
61 int CORE_sgelqt(int M, int N, int IB,
62  float *A, int LDA,
63  float *T, int LDT,
64  float *TAU,
65  float *WORK);
66 void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB,
67  int M, int N, int K,
68  float alpha, const float *A, int LDA,
69  const float *B, int LDB,
70  float beta, float *C, int LDC);
71 void CORE_sgemv(PLASMA_enum trans, int M, int N,
72  float alpha, const float *A, int LDA,
73  const float *x, int incx,
74  float beta, float *y, int incy);
/*
 * CORE_sgeqp3_* helper prototypes.
 * - larfg, norms and pivot receive the PLASMA_desc A by value, not by pointer.
 * - tntpiv is the only one returning int; the others return void.
 * - pivot and update take an `int *info` argument (presumably a status
 *   output - confirm in the implementation).
 * - update const-qualifies Ajj and Fk; Ajk, norms1 and norms2 are writable.
 */
75 void CORE_sgeqp3_init( int n, int *jpvt );
76 void CORE_sgeqp3_larfg( PLASMA_desc A, int ii, int jj, int i, int j,
77  float *tau, float *beta );
78 void CORE_sgeqp3_norms( PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2 );
79 void CORE_sgeqp3_pivot( PLASMA_desc A, float *F, int ldf,
80  int jj, int k, int *jpvt,
81  float *norms1, float *norms2, int *info );
82 int CORE_sgeqp3_tntpiv(int m, int n,
83  float *A, int lda,
84  int *IPIV, float *tau,
85  int *iwork);
86 void CORE_sgeqp3_update( const float *Ajj, int lda1,
87  float *Ajk, int lda2,
88  const float *Fk, int ldf,
89  int joff, int k, int koff, int nb,
90  float *norms1, float *norms2,
91  int *info );
/*
 * CORE_sgeqrt, CORE_sgessm, CORE_sgessq, the CORE_sgetf2/CORE_sgetrf family
 * and CORE_sgetrip.
 * CORE_sgessm const-qualifies IPIV and L and writes only A; CORE_sgessq reads
 * A and updates *scale / *sumsq.
 */
92 int CORE_sgeqrt(int M, int N, int IB,
93  float *A, int LDA,
94  float *T, int LDT,
95  float *TAU, float *WORK);
96 int CORE_sgessm(int M, int N, int K, int IB,
97  const int *IPIV,
98  const float *L, int LDL,
99  float *A, int LDA);
100 int CORE_sgessq(int M, int N,
101  const float *A, int LDA,
102  float *scale, float *sumsq);
/* The *_nopiv variants take no IPIV argument and have no INFO out-parameter. */
103 int CORE_sgetf2_nopiv(int m, int n,
104  float *A, int lda);
105 int CORE_sgetrf(int M, int N,
106  float *A, int LDA,
107  int *IPIV, int *INFO);
108 int CORE_sgetrf_incpiv(int M, int N, int IB,
109  float *A, int LDA,
110  int *IPIV, int *INFO);
111 int CORE_sgetrf_nopiv(int m, int n, int ib,
112  float *A, int lda);
/*
 * The reclap / rectil kernels take a CORE_sgetrf_data_t handle as first
 * argument; the matching *_init(nbthrd) functions return such a handle.
 * These prototypes rely on the CORE_sgetrf_data_t typedef for
 * struct CORE_sgetrf_data_s being in scope.
 * Note that CORE_sgetrf_rectil receives the PLASMA_desc A by value.
 */
113 int CORE_sgetrf_reclap(CORE_sgetrf_data_t *data, int M, int N,
114  float *A, int LDA,
115  int *IPIV, int *info);
116 CORE_sgetrf_data_t *CORE_sgetrf_reclap_init(int nbthrd);
117 int CORE_sgetrf_rectil(CORE_sgetrf_data_t *data, const PLASMA_desc A, int *IPIV, int *info);
118 CORE_sgetrf_data_t *CORE_sgetrf_rectil_init(int nbthrd);
119 void CORE_sgetrip(int m, int n, float *A,
120  float *work);
/*
 * CORE_shbelr, CORE_shblrx, CORE_shbrce: same parameter list as the
 * CORE_sgbelr / CORE_sgblrx / CORE_sgbrce prototypes declared earlier in this
 * header (uplo, N, PLASMA_desc pointer, V, TAU, st, ed, eltsize); all return int.
 */
121 int CORE_shbelr(PLASMA_enum uplo, int N,
122  PLASMA_desc *A, float *V, float *TAU,
123  int st, int ed, int eltsize);
124 int CORE_shblrx(PLASMA_enum uplo, int N,
125  PLASMA_desc *A, float *V, float *TAU,
126  int st, int ed, int eltsize);
127 int CORE_shbrce(PLASMA_enum uplo, int N,
128  PLASMA_desc *A, float *V, float *TAU,
129  int st, int ed, int eltsize);
/*
 * CORE_ssbtype1cb / 2cb / 3cb share one parameter list and return void.
 * The only difference visible in the prototypes: type 3 takes V and TAU as
 * const, types 1 and 2 take them writable.
 */
130 void CORE_ssbtype1cb(int N, int NB,
131  float *A, int LDA,
132  float *V, float *TAU,
133  int st, int ed, int sweep, int Vblksiz, int WANTZ,
134  float *WORK);
135 void CORE_ssbtype2cb(int N, int NB,
136  float *A, int LDA,
137  float *V, float *TAU,
138  int st, int ed, int sweep, int Vblksiz, int WANTZ,
139  float *WORK);
140 void CORE_ssbtype3cb(int N, int NB,
141  float *A, int LDA,
142  const float *V, const float *TAU,
143  int st, int ed, int sweep, int Vblksiz, int WANTZ,
144  float *WORK);
/*
 * CORE_sgbtype1cb / 2cb / 3cb: identical parameter lists, all returning void.
 * Compared with the CORE_ssbtype*cb prototypes they add a leading `uplo` and
 * use two vector/scalar pairs (VQ/TAUQ and VP/TAUP) instead of one (V/TAU).
 * Unlike CORE_ssbtype3cb, the type-3 variant here keeps all pointers non-const.
 */
145 void CORE_sgbtype1cb(PLASMA_enum uplo, int N, int NB,
146  float *A, int LDA,
147  float *VQ, float *TAUQ,
148  float *VP, float *TAUP,
149  int st, int ed, int sweep, int Vblksiz, int WANTZ,
150  float *WORK);
151 void CORE_sgbtype2cb(PLASMA_enum uplo, int N, int NB,
152  float *A, int LDA,
153  float *VQ, float *TAUQ,
154  float *VP, float *TAUP,
155  int st, int ed, int sweep, int Vblksiz, int WANTZ,
156  float *WORK);
157 void CORE_sgbtype3cb(PLASMA_enum uplo, int N, int NB,
158  float *A, int LDA,
159  float *VQ, float *TAUQ,
160  float *VP, float *TAUP,
161  int st, int ed, int sweep, int Vblksiz, int WANTZ,
162  float *WORK);
/* CORE_ssygst: returns void; takes an `int *INFO` argument (presumably a status output - confirm). */
163 void CORE_ssygst(int itype, PLASMA_enum uplo, int N,
164  float *A, int LDA,
165  float *B, int LDB, int *INFO);
/*
 * Declarations compiled only when COMPLEX is defined. This header defines
 * REAL near its top and the visible part never defines COMPLEX, so this group
 * is skipped unless COMPLEX is supplied from elsewhere.
 * CORE_ssymm, CORE_ssyrk and CORE_ssyr2k are declared again, unconditionally
 * and with the same parameter lists, later in this header. CORE_shessq has the
 * same parameter list as the unconditional CORE_ssyssq.
 * NOTE(review): this looks like an artifact of generating the header from a
 * complex-precision template - confirm before relying on CORE_shessq.
 */
166 #ifdef COMPLEX
167 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
168  int M, int N,
169  float alpha, const float *A, int LDA,
170  const float *B, int LDB,
171  float beta, float *C, int LDC);
172 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
173  int N, int K,
174  float alpha, const float *A, int LDA,
175  float beta, float *C, int LDC);
176 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
177  int N, int K,
178  float alpha, const float *A, int LDA,
179  const float *B, int LDB,
180  float beta, float *C, int LDC);
181 int CORE_shessq(PLASMA_enum uplo, int N,
182  const float *A, int LDA,
183  float *scale, float *sumsq);
184 #endif
/*
 * CORE_ssyrfb, CORE_slacpy, CORE_slacpy_pivot, CORE_slange.
 * - CORE_ssyrfb: A and T are const; C and WORK are writable; returns int.
 * - CORE_slacpy: const source A, writable destination B; returns void.
 * - CORE_slacpy_pivot: receives the descriptor by value (const PLASMA_desc)
 *   and a const pivot array; rankin, rankout and A are writable.
 * - CORE_slange: returns void and delivers its result through `normA`
 *   (a writable float pointer); `norm` is a plain int here, whereas
 *   CORE_slantr declares its `norm` as PLASMA_enum.
 */
185 int CORE_ssyrfb(PLASMA_enum uplo, int N, int K, int IB, int NB,
186  const float *A, int LDA,
187  const float *T, int LDT,
188  float *C, int LDC,
189  float *WORK, int LDWORK);
190 void CORE_slacpy(PLASMA_enum uplo, int M, int N,
191  const float *A, int LDA,
192  float *B, int LDB);
193 int CORE_slacpy_pivot( const PLASMA_desc descA,
194  PLASMA_enum direct,
195  int k1, int k2, const int *ipiv,
196  int *rankin, int *rankout,
197  float *A, int lda,
198  int init);
199 void CORE_slange(int norm, int M, int N,
200  const float *A, int LDA,
201  float *work, float *normA);
/*
 * CORE_slansy is declared twice: once under `#ifdef COMPLEX` and once
 * unconditionally. The two declarations are token-for-token the same, so the
 * guard has no effect on what callers see; with COMPLEX defined the compiler
 * simply sees a compatible redeclaration.
 */
202 #ifdef COMPLEX
203 void CORE_slansy(int norm, PLASMA_enum uplo, int N,
204  const float *A, int LDA,
205  float *work, float *normA);
206 #endif
207 void CORE_slansy(int norm, PLASMA_enum uplo, int N,
208  const float *A, int LDA,
209  float *work, float *normA);
/*
 * CORE_slantr, CORE_slarfb_gemm, the CORE_slarfx2* family, CORE_slarfy,
 * CORE_slascal, CORE_slaset and CORE_slaset2.
 */
/* CORE_slantr: returns void; the result pointer is `normA`. */
210 void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag,
211  int M, int N,
212  const float *A, int LDA,
213  float *work, float *normA);
/* CORE_slarfb_gemm: V and T are const; C and WORK are writable. */
214 int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
215  int M, int N, int K,
216  const float *V, int LDV,
217  const float *T, int LDT,
218  float *C, int LDC,
219  float *WORK, int LDWORK);
/*
 * CORE_slarfx2 and CORE_slarfx2c take V and TAU by value; CORE_slarfx2ce
 * takes them through non-const pointers (so it may modify them - confirm).
 */
220 int CORE_slarfx2(PLASMA_enum side, int N,
221  float V,
222  float TAU,
223  float *C1, int LDC1,
224  float *C2, int LDC2);
225 int CORE_slarfx2c(PLASMA_enum uplo,
226  float V,
227  float TAU,
228  float *C1,
229  float *C2,
230  float *C3);
231 int CORE_slarfx2ce(PLASMA_enum uplo,
232  float *V,
233  float *TAU,
234  float *C1,
235  float *C2,
236  float *C3);
/* CORE_slarfy: V and TAU are const pointers here; A and WORK are writable. */
237 void CORE_slarfy(int N,
238  float *A, int LDA,
239  const float *V,
240  const float *TAU,
241  float *WORK);
242 int CORE_slascal(PLASMA_enum uplo, int m, int n,
243  float alpha, float *A, int lda);
/* CORE_slaset takes two scalars (alpha, beta); CORE_slaset2 takes only alpha. */
244 void CORE_slaset(PLASMA_enum uplo, int n1, int n2,
245  float alpha, float beta,
246  float *tileA, int ldtilea);
247 void CORE_slaset2(PLASMA_enum uplo, int n1, int n2, float alpha,
248  float *tileA, int ldtilea);
/*
 * CORE_slaswp family, CORE_slatro, CORE_slauum, CORE_spamm, CORE_sparfb and
 * CORE_spemv.
 */
/*
 * CORE_slaswp works on a raw float array and returns void; the *_ontile
 * variants take a PLASMA_desc by value instead and return int. The pivot
 * array is const in all three.
 */
249 void CORE_slaswp(int N, float *A, int LDA,
250  int I1, int I2, const int *IPIV, int INC);
251 int CORE_slaswp_ontile( PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc);
252 int CORE_slaswpc_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc);
/* CORE_slatro: const source A, writable destination B. */
253 int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans,
254  int M, int N,
255  const float *A, int LDA,
256  float *B, int LDB);
257 void CORE_slauum(PLASMA_enum uplo, int N, float *A, int LDA);
/* CORE_spamm: `op` is a plain int selector; A1 and V are const, A2 and W writable. */
258 int CORE_spamm(int op, PLASMA_enum side, PLASMA_enum storev,
259  int M, int N, int K, int L,
260  const float *A1, int LDA1,
261  float *A2, int LDA2,
262  const float *V, int LDV,
263  float *W, int LDW);
/* CORE_sparfb: A1 and A2 are both writable; V and T are const. */
264 int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev,
265  int M1, int N1, int M2, int N2, int K, int L,
266  float *A1, int LDA1,
267  float *A2, int LDA2,
268  const float *V, int LDV,
269  const float *T, int LDT,
270  float *WORK, int LDWORK);
/* CORE_spemv: A and X are const; Y and WORK are writable. */
271 int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev,
272  int M, int N, int L,
273  float ALPHA,
274  const float *A, int LDA,
275  const float *X, int INCX,
276  float BETA,
277  float *Y, int INCY,
278  float *WORK);
/*
 * CORE_splgsy: returns void; A is the only pointer argument and is writable.
 * `seed` is a 64-bit-capable unsigned integer passed by value.
 * NOTE(review): by its name and its (bump, bigM, m0, n0, seed) arguments this
 * presumably fills one tile of a generated symmetric matrix - confirm against
 * the kernel source.
 */
void CORE_splgsy(float bump, int m, int n, float *A, int lda,
                 int bigM, int m0, int n0, unsigned long long int seed);
/*
 * CORE_splrnt and the CORE_spltmg* prototypes.
 * NOTE(review): the names and the seed / global-offset arguments suggest
 * test-matrix generators - confirm against the kernel sources.
 */
/* CORE_splrnt: same arguments as CORE_splgsy minus the leading `bump`. */
283 void CORE_splrnt(int m, int n, float *A, int lda,
284  int bigM, int m0, int n0, unsigned long long int seed );
/* CORE_spltmg: selects by `mtxtype`; returns int, unlike CORE_splrnt. */
285 int CORE_spltmg(PLASMA_enum mtxtype, int m, int n, float *A, int lda,
286  int gM, int gN, int m0, int n0, unsigned long long int seed );
/* chebvand takes a writable W; circul takes a const V. */
287 int CORE_spltmg_chebvand( int M, int N, float *A, int LDA,
288  int gN, int m0, int n0,
289  float *W );
290 int CORE_spltmg_circul( int M, int N, float *A, int LDA,
291  int gM, int m0, int n0,
292  const float *V );
293 void CORE_spltmg_condexq( int M, int N, float *Q, int LDQ );
/* fiedler: X and Y are const inputs with explicit increments; A is the output. */
294 void CORE_spltmg_fiedler(int m, int n,
295  const float *X, int incX,
296  const float *Y, int incY,
297  float *A, int lda);
298 int CORE_spltmg_hankel( PLASMA_enum uplo, int M, int N, float *A, int LDA,
299  int m0, int n0, int nb,
300  const float *V1,
301  const float *V2 );
/* toeppd1 writes W (and takes the seed); toeppd2 reads W as const and writes A. */
302 void CORE_spltmg_toeppd1( int gM, int m0, int M, float *W,
303  unsigned long long int seed );
304 void CORE_spltmg_toeppd2( int M, int N, int K, int m0, int n0,
305  const float *W,
306  float *A, int LDA );
/*
 * CORE_spotrf, CORE_ssetvar, CORE_sshift, CORE_sshiftw, CORE_sssssm,
 * CORE_sstedc and CORE_ssteqr.
 */
/* CORE_spotrf: returns void; takes an `int *INFO` argument (presumably a status output - confirm). */
307 void CORE_spotrf(PLASMA_enum uplo, int N, float *A, int LDA, int *INFO);
/* CORE_ssetvar: alpha is read through a const pointer, x is writable. */
308 void CORE_ssetvar(const float *alpha, float *x);
/* CORE_sshiftw has the arguments of CORE_sshift plus `cl` and a writable W. */
309 void CORE_sshift(int s, int m, int n, int L,
310  float *A);
311 void CORE_sshiftw(int s, int cl, int m, int n, int L,
312  float *A, float *W);
/* CORE_sssssm: A1 and A2 are writable; L1, L2 and IPIV are const. */
313 int CORE_sssssm(int M1, int N1, int M2, int N2, int K, int IB,
314  float *A1, int LDA1,
315  float *A2, int LDA2,
316  const float *L1, int LDL1,
317  const float *L2, int LDL2,
318  const int *IPIV);
/*
 * CORE_sstedc: the RWORK / LRWORK pair is part of the parameter list only
 * when COMPLEX is defined, so the arity of this function depends on that
 * macro. This header defines REAL near its top.
 */
319 int CORE_sstedc(PLASMA_enum compz, int n,
320  float *D, float *E,
321  float *Z, int LDZ,
322  float *WORK, int LWORK,
323 #ifdef COMPLEX
324  float *RWORK, int LRWORK,
325 #endif
326  int *IWORK, int LIWORK);
/* CORE_ssteqr: unlike CORE_sstedc it takes WORK without a length and has no IWORK. */
327 int CORE_ssteqr(PLASMA_enum compz, int n,
328  float *D, float *E,
329  float *Z, int LDZ,
330  float *WORK);
/*
 * Unconditional declarations of CORE_ssymm, CORE_ssyrk and CORE_ssyr2k
 * (the same prototypes also appear under `#ifdef COMPLEX` earlier in this
 * header), followed by CORE_ssyssq, CORE_sswpab, CORE_sswptr_ontile,
 * CORE_stradd, CORE_strasm and CORE_strdalg1.
 * In the three BLAS-style prototypes every array operand except C is const.
 */
331 void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo,
332  int M, int N,
333  float alpha, const float *A, int LDA,
334  const float *B, int LDB,
335  float beta, float *C, int LDC);
336 void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans,
337  int N, int K,
338  float alpha, const float *A, int LDA,
339  float beta, float *C, int LDC);
340 void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans,
341  int N, int K,
342  float alpha, const float *A, int LDA,
343  const float *B, int LDB,
344  float beta, float *C, int LDC);
/* CORE_ssyssq: reads A (const) and updates *scale / *sumsq; returns int. */
345 int CORE_ssyssq(PLASMA_enum uplo, int N,
346  const float *A, int LDA,
347  float *scale, float *sumsq);
348 void CORE_sswpab(int i, int n1, int n2,
349  float *A, float *work);
/* CORE_sswptr_ontile: CORE_slaswp_ontile's arguments plus a const tile Akk / ldak. */
350 int CORE_sswptr_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc,
351  const float *Akk, int ldak);
/* CORE_stradd: same arguments as CORE_sgeadd with a leading `uplo`. */
352 int CORE_stradd(PLASMA_enum uplo, PLASMA_enum trans, int M, int N,
353  float alpha,
354  const float *A, int LDA,
355  float beta,
356  float *B, int LDB);
/* CORE_strasm: `storev` is a PLASMA_enum here, while CORE_sasum declares it as int. */
357 void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag,
358  int M, int N, const float *A, int lda, float *work);
/* CORE_strdalg1: like CORE_sbrdalg1 but without `uplo` and with one V/TAU pair. */
359 void CORE_strdalg1(int n,
360  int nb,
361  float *A,
362  int lda,
363  float *V,
364  float *TAU,
365  int Vblksiz, int wantz,
366  int i, int sweepid, int m, int grsiz,
367  float *work);
/*
 * CORE_strmm, CORE_strsm, CORE_strssq, CORE_strtri, CORE_stslqt and the
 * CORE_stsmlq family.
 */
/* CORE_strmm / CORE_strsm: identical parameter lists; A is const, B is updated in place. */
368 void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo,
369  PLASMA_enum transA, PLASMA_enum diag,
370  int M, int N,
371  float alpha, const float *A, int LDA,
372  float *B, int LDB);
373 void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo,
374  PLASMA_enum transA, PLASMA_enum diag,
375  int M, int N,
376  float alpha, const float *A, int LDA,
377  float *B, int LDB);
378 int CORE_strssq(PLASMA_enum uplo, PLASMA_enum diag, int M, int N,
379  const float *A, int LDA,
380  float *scale, float *sumsq);
381 void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag, int N,
382  float *A, int LDA, int *info);
/* CORE_stslqt: two writable tiles (A1, A2) plus T, TAU and WORK. */
383 int CORE_stslqt(int M, int N, int IB,
384  float *A1, int LDA1,
385  float *A2, int LDA2,
386  float *T, int LDT,
387  float *TAU, float *WORK);
/*
 * CORE_stsmlq and its variants: V and T are const inputs, the A tiles and
 * WORK are writable.
 * - _corner takes three tiles (A1, A2, A3) plus an `nb` argument and has no
 *   side/trans arguments.
 * - _sytra1 has the same argument list as CORE_stsmlq (lower-case names).
 */
388 int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans,
389  int M1, int N1, int M2, int N2, int K, int IB,
390  float *A1, int LDA1,
391  float *A2, int LDA2,
392  const float *V, int LDV,
393  const float *T, int LDT,
394  float *WORK, int LDWORK);
395 int CORE_stsmlq_corner( int m1, int n1, int m2, int n2, int m3, int n3,
396  int k, int ib, int nb,
397  float *A1, int lda1,
398  float *A2, int lda2,
399  float *A3, int lda3,
400  const float *V, int ldv,
401  const float *T, int ldt,
402  float *WORK, int ldwork);
403 int CORE_stsmlq_sytra1( PLASMA_enum side, PLASMA_enum trans,
404  int m1, int n1, int m2, int n2,
405  int k, int ib,
406  float *A1, int lda1,
407  float *A2, int lda2,
408  const float *V, int ldv,
409  const float *T, int ldt,
410  float *WORK, int ldwork);
/*
 * CORE_stsmqr family, CORE_stsqrt, CORE_ststrf, CORE_sttmqr and CORE_sttqrt.
 * The CORE_stsmqr / _corner / _sytra1 prototypes mirror the CORE_stsmlq ones
 * argument for argument: V and T are const, the A tiles and WORK are writable.
 */
411 int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans,
412  int M1, int N1, int M2, int N2, int K, int IB,
413  float *A1, int LDA1,
414  float *A2, int LDA2,
415  const float *V, int LDV,
416  const float *T, int LDT,
417  float *WORK, int LDWORK);
418 int CORE_stsmqr_corner( int m1, int n1, int m2, int n2, int m3, int n3,
419  int k, int ib, int nb,
420  float *A1, int lda1,
421  float *A2, int lda2,
422  float *A3, int lda3,
423  const float *V, int ldv,
424  const float *T, int ldt,
425  float *WORK, int ldwork);
426 int CORE_stsmqr_sytra1( PLASMA_enum side, PLASMA_enum trans,
427  int m1, int n1, int m2, int n2,
428  int k, int ib,
429  float *A1, int lda1,
430  float *A2, int lda2,
431  const float *V, int ldv,
432  const float *T, int ldt,
433  float *WORK, int ldwork);
/* CORE_stsqrt: same argument list as CORE_stslqt. */
434 int CORE_stsqrt(int M, int N, int IB,
435  float *A1, int LDA1,
436  float *A2, int LDA2,
437  float *T, int LDT,
438  float *TAU, float *WORK);
/* CORE_ststrf: three writable tiles (U, A, L), a writable IPIV and an `int *INFO` argument. */
439 int CORE_ststrf(int M, int N, int IB, int NB,
440  float *U, int LDU,
441  float *A, int LDA,
442  float *L, int LDL,
443  int *IPIV, float *WORK,
444  int LDWORK, int *INFO);
/* CORE_sttmqr: same argument list as CORE_stsmqr. */
445 int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans,
446  int M1, int N1, int M2, int N2, int K, int IB,
447  float *A1, int LDA1,
448  float *A2, int LDA2,
449  const float *V, int LDV,
450  const float *T, int LDT,
451  float *WORK, int LDWORK);
/* CORE_sttqrt: same argument list as CORE_stsqrt. */
452 int CORE_sttqrt(int M, int N, int IB,
453  float *A1, int LDA1,
454  float *A2, int LDA2,
455  float *T, int LDT,
456  float *TAU,
457  float *WORK);
/* CORE_sttmlq and CORE_sttlqt: same argument lists as CORE_stsmlq and CORE_stslqt. */
458 int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans,
459  int M1, int N1, int M2, int N2, int K, int IB,
460  float *A1, int LDA1,
461  float *A2, int LDA2,
462  const float *V, int LDV,
463  const float *T, int LDT,
464  float *WORK, int LDWORK);
465 int CORE_sttlqt(int M, int N, int IB,
466  float *A1, int LDA1,
467  float *A2, int LDA2,
468  float *T, int LDT,
469  float *TAU,
470  float *WORK);
/*
 * CORE_sormlq / CORE_sormqr: V and T are const, C and WORK are writable.
 * NOTE(review): the two prototypes name their 5th and 6th arguments in
 * opposite order - (IB, K) for CORE_sormlq, (K, IB) for CORE_sormqr. Both are
 * plain int, so a swapped call compiles silently; confirm against the
 * function definitions which order is actually expected.
 */
471 int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans,
472  int M, int N, int IB, int K,
473  const float *V, int LDV,
474  const float *T, int LDT,
475  float *C, int LDC,
476  float *WORK, int LDWORK);
477 int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans,
478  int M, int N, int K, int IB,
479  const float *V, int LDV,
480  const float *T, int LDT,
481  float *C, int LDC,
482  float *WORK, int LDWORK);
483 
/*
 * CORE_slaed2_*, CORE_slaed3_* and CORE_slaed4 helper prototypes, declared
 * only when COMPLEX is NOT defined. Most of them take a [start, end) style
 * pair of ints as their last two arguments (whether `end` is inclusive is not
 * visible here - confirm in the kernels).
 * NOTE(review): the names match LAPACK's xLAED2/3/4 divide-and-conquer
 * helpers - confirm the exact semantics against the kernel sources.
 */
484 #ifndef COMPLEX
/* computeK: K is an out-parameter (int *); beta is passed by pointer here. */
485 void CORE_slaed2_computeK(int *K, int n, int n1,
486  float *beta, float *D, float *Q, int LDQ,
487  float *Z, float *DLAMBDA, float *W,
488  int *INDX, int *INDXC, int *INDXP, int *INDXQ,
489  int *COLTYP);
/* compressq reads Q (const) and writes Q2; copydef reads Q2 (const) and writes Q. */
490 void CORE_slaed2_compressq(int n, int n1, const int *INDX, const int *ctot,
491  const float *Q, int LDQ, float *Q2,
492  int start, int end);
493 void CORE_slaed2_copydef(int n, int n1, int K, const int *ctot,
494  float *Q, int LDQ, const float *Q2,
495  int start, int end);
/* CORE_slaed4: the only function in this group returning int; beta is by value here. */
496 int CORE_slaed4(int n, int K,
497  float *D, float beta,
498  float *Q, int LDQ,
499  const float *D0, const float *Z,
500  const int *INDX,
501  int start, int end );
502 void CORE_slaed3_computeW(int n, int K,
503  const float *Q, int LDQ,
504  const float *DLAMBDA, float *W,
505  const int *INDX,
506  int start, int end);
507 void CORE_slaed3_reduceW(int n, int n1, int K, int l,
508  const float *Q, int LDQ,
509  const float *Wred, float *W);
510 void CORE_slaed3_computevectors(int K, int il_nondef, int iu_nondef,
511  float *Q, int LDQ, float *W, float *S,
512  const int *INDXC,
513  int start, int end);
514 void CORE_slaed3_merge( int n, int K, float *D, int *INDXQ );
/* updatevectors: `op` and `wsmode` are plain int selectors; ctot is const. */
515 void CORE_slaed3_updatevectors(int op, int wsmode, int n, int n1, int K,
516  int il_nondef, int iu_nondef,
517  float *Q, int ldq, float *Q2,
518  const int *ctot, float *WORK, int start, int end);
519 #endif
/*
 * CORE_sswap and CORE_slascl are declared unconditionally.
 * CORE_sswap reads `work` and `perm` as const and writes Q.
 */
520 void CORE_sswap(int m, int n, float *Q, int ldq,
521  const float *work, const int *perm,
522  int start, int end);
523 int CORE_slascl(PLASMA_enum type, int kl, int ku, float cfrom, float cto,
524  int m, int n, float *A, int lda);
/*
 * CORE_slag2c is declared only when COMPLEX is defined; this header defines
 * REAL near its top and the visible part never defines COMPLEX.
 */
525 #ifdef COMPLEX
526 int CORE_slag2c(int m, int n, const float *Q, int LDQ,
527  float *Z, int LDZ);
528 #endif
529 
/*
 * Declared only when COMPLEX is NOT defined.
 * CORE_slaed3_freebigwork takes WORK as a pointer to pointer (float **).
 */
530 #ifndef COMPLEX
531 void CORE_slaed3_freebigwork(int oper, float **WORK);
532 void CORE_slaed0_betaapprox(int subpbs, const int *subpbs_info,
533  float *D, const float *E);
534 int CORE_slapst(PLASMA_enum type, int n,
535  const float *D, int *INDX);
536 #endif
537 
538 #if defined(QUARK_H)
539 
/*
 * QUARK_CORE_* prototypes (inside the `#if defined(QUARK_H)` region).
 * Every wrapper in this group returns void and takes the Quark handle and
 * the Quark_Task_Flags pointer as its first two arguments.
 * NOTE(review): presumably each one submits the matching CORE_ kernel as a
 * QUARK task - confirm against the wrapper sources.
 */
/*
 * sasum / sasum_f1: besides the CORE_sasum arguments they take explicit sizes
 * (szeA, szeW); the _f1 variant adds one extra `fake` buffer with its size.
 * Here `storev` is a PLASMA_enum, while CORE_sasum declares it as int.
 */
542 void QUARK_CORE_sasum(Quark *quark, Quark_Task_Flags *task_flags,
543  PLASMA_enum storev, PLASMA_enum uplo, int m, int n,
544  const float *A, int lda, int szeA,
545  float *work, int szeW);
546 void QUARK_CORE_sasum_f1(Quark *quark, Quark_Task_Flags *task_flags,
547  PLASMA_enum storev, PLASMA_enum uplo, int m, int n,
548  const float *A, int lda, int szeA,
549  float *work, int szeW,
550  float *fake, int szeF);
/* sgeadd: the CORE_sgeadd arguments plus an `nb` after m, n. */
551 void QUARK_CORE_sgeadd(Quark *quark, Quark_Task_Flags *task_flags,
552  PLASMA_enum trans, int m, int n, int nb,
553  float alpha,
554  const float *A, int lda,
555  float beta,
556  float *B, int ldb);
/* sbrdalg1: has no `work` argument; ends with three int pointers (PCOL, ACOL, MCOL) instead. */
557 void QUARK_CORE_sbrdalg1(Quark *quark, Quark_Task_Flags *task_flags,
558  PLASMA_enum uplo,
559  int n, int nb,
560  float *A,
561  int lda,
562  float *VQ,
563  float *TAUQ,
564  float *VP,
565  float *TAUP,
566  int Vblksiz, int wantz,
567  int i, int sweepid, int m, int grsiz,
568  int *PCOL, int *ACOL, int *MCOL);
/* sgelqt: unlike CORE_sgelqt there are no TAU / WORK arguments; `nb` is added. */
569 void QUARK_CORE_sgelqt(Quark *quark, Quark_Task_Flags *task_flags,
570  int m, int n, int ib, int nb,
571  float *A, int lda,
572  float *T, int ldt);
/*
 * QUARK_CORE_sgemm and its variants. All return void and share the leading
 * (quark, task_flags, transA, transB, m, n, k, nb) arguments. Differences
 * visible in the prototypes:
 *   sgemm, sgemm2 - identical argument lists;
 *   sgemm_f2      - adds two (fake, szefake, flag) triples;
 *   sgemm_p2      - B is `const float **` (pointer to pointer);
 *   sgemm_p2f1    - as _p2, plus one (fake, szefake, flag) triple;
 *   sgemm_p3      - C is `float **` (pointer to pointer);
 *   sgemm_tile    - alpha and beta are passed by const pointer, and three
 *                   const `*lock` pointers are appended.
 * NOTE(review): the fake and lock arguments are presumably used only for
 * dependency tracking - confirm against the wrapper sources.
 */
573 void QUARK_CORE_sgemm(Quark *quark, Quark_Task_Flags *task_flags,
574  PLASMA_enum transA, PLASMA_enum transB,
575  int m, int n, int k, int nb,
576  float alpha, const float *A, int lda,
577  const float *B, int ldb,
578  float beta, float *C, int ldc);
579 void QUARK_CORE_sgemm2( Quark *quark, Quark_Task_Flags *task_flags,
580  PLASMA_enum transA, PLASMA_enum transB,
581  int m, int n, int k, int nb,
582  float alpha, const float *A, int lda,
583  const float *B, int ldb,
584  float beta, float *C, int ldc);
585 void QUARK_CORE_sgemm_f2(Quark *quark, Quark_Task_Flags *task_flags,
586  PLASMA_enum transA, PLASMA_enum transB,
587  int m, int n, int k, int nb,
588  float alpha, const float *A, int lda,
589  const float *B, int ldb,
590  float beta, float *C, int ldc,
591  float *fake1, int szefake1, int flag1,
592  float *fake2, int szefake2, int flag2);
593 void QUARK_CORE_sgemm_p2(Quark *quark, Quark_Task_Flags *task_flags,
594  PLASMA_enum transA, PLASMA_enum transB,
595  int m, int n, int k, int nb,
596  float alpha, const float *A, int lda,
597  const float **B, int ldb,
598  float beta, float *C, int ldc);
599 void QUARK_CORE_sgemm_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
600  PLASMA_enum transA, PLASMA_enum transB,
601  int m, int n, int k, int nb,
602  float alpha, const float *A, int lda,
603  const float **B, int ldb,
604  float beta, float *C, int ldc,
605  float *fake1, int szefake1, int flag1);
606 void QUARK_CORE_sgemm_p3(Quark *quark, Quark_Task_Flags *task_flags,
607  PLASMA_enum transA, PLASMA_enum transB,
608  int m, int n, int k, int nb,
609  float alpha, const float *A, int lda,
610  const float *B, int ldb,
611  float beta, float **C, int ldc);
612 void QUARK_CORE_sgemm_tile(Quark *quark, Quark_Task_Flags *task_flags,
613  PLASMA_enum transA, PLASMA_enum transB,
614  int m, int n, int k, int nb,
615  const float *alpha, const float *A, int lda,
616  const float *B, int ldb,
617  const float *beta, float *C, int ldc,
618  const float *Alock,
619  const float *Block,
620  const float *Clock);
/*
 * QUARK_CORE_sgemv, QUARK_CORE_sgemv_tile and the QUARK_CORE_sgeqp3_*
 * wrappers. All return void and start with (quark, task_flags).
 */
/* sgemv: CORE_sgemv's arguments; the _tile variant passes alpha/beta by const pointer and appends three const lock pointers. */
621 void QUARK_CORE_sgemv(Quark *quark, Quark_Task_Flags *task_flags,
622  PLASMA_enum trans, int m, int n,
623  float alpha, const float *A, int lda,
624  const float *x, int incx,
625  float beta, float *y, int incy);
626 void QUARK_CORE_sgemv_tile(Quark *quark, Quark_Task_Flags *task_flags,
627  PLASMA_enum trans,
628  int m, int n,
629  const float *alpha, const float *A, int lda,
630  const float *x, int incx,
631  const float *beta, float *y, int incy,
632  const float *Alock,
633  const float *xlock,
634  const float *ylock);
/* init, larfg, norms, pivot: the corresponding CORE_sgeqp3_* arguments after the two QUARK arguments. */
635 void QUARK_CORE_sgeqp3_init( Quark *quark, Quark_Task_Flags *task_flags,
636  int n, int *jpvt );
637 void QUARK_CORE_sgeqp3_larfg(Quark *quark, Quark_Task_Flags *task_flags,
638  PLASMA_desc A, int ii, int jj, int i, int j,
639  float *tau, float *beta );
640 void QUARK_CORE_sgeqp3_norms( Quark *quark, Quark_Task_Flags *task_flags,
641  PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2 );
642 void QUARK_CORE_sgeqp3_pivot( Quark *quark, Quark_Task_Flags *task_flags,
643  PLASMA_desc A,
644  float *F, int ldf,
645  int jj, int k, int *jpvt,
646  float *norms1, float *norms2, int *info );
/*
 * tntpiv: differs from CORE_sgeqp3_tntpiv - no tau / iwork arguments; adds nb
 * and the (sequence, request, check_info, iinfo) group.
 */
647 void QUARK_CORE_sgeqp3_tntpiv(Quark *quark, Quark_Task_Flags *task_flags,
648  int m, int n, int nb,
649  float *A, int lda,
650  int *IPIV,
651  PLASMA_sequence *sequence, PLASMA_request *request,
652  PLASMA_bool check_info, int iinfo);
/*
 * update: Ajj and Fk are non-const here, whereas CORE_sgeqp3_update declares
 * them const. NOTE(review): confirm whether the wrapper really needs write
 * access or the qualifier was simply dropped.
 */
653 void QUARK_CORE_sgeqp3_update( Quark *quark, Quark_Task_Flags *task_flags,
654  float *Ajj, int lda1,
655  float *Ajk, int lda2,
656  float *Fk, int ldf,
657  int joff, int k, int koff, int nb,
658  float *norms1, float *norms2, int *info );
/*
 * QUARK_CORE_sgeqrt, sgessm, sgessq_f1, the sgetrf family and the sgetrip
 * variants. All return void and start with (quark, task_flags).
 */
/* sgeqrt: no TAU / WORK arguments (CORE_sgeqrt has them); `nb` is added. */
659 void QUARK_CORE_sgeqrt(Quark *quark, Quark_Task_Flags *task_flags,
660  int m, int n, int ib, int nb,
661  float *A, int lda,
662  float *T, int ldt);
663 void QUARK_CORE_sgessm(Quark *quark, Quark_Task_Flags *task_flags,
664  int m, int n, int k, int ib, int nb,
665  const int *IPIV,
666  const float *L, int ldl,
667  float *A, int lda);
/* sgessq_f1: CORE_sgessq's arguments plus one (fake, szeF, paramF) triple. */
668 void QUARK_CORE_sgessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
669  int m, int n, const float *A, int lda,
670  float *scale, float *sumsq,
671  float *fake, int szeF, int paramF );
/*
 * sgetrf wrappers: instead of an `int *INFO` out-parameter they take a
 * PLASMA_sequence / PLASMA_request pair plus `iinfo`; all but the _nopiv
 * variant also take a PLASMA_bool `check_info`.
 * NOTE(review): presumably errors are reported through sequence/request with
 * iinfo as an index offset - confirm against the wrapper sources.
 */
672 void QUARK_CORE_sgetrf(Quark *quark, Quark_Task_Flags *task_flags,
673  int m, int n, int nb,
674  float *A, int lda,
675  int *IPIV,
676  PLASMA_sequence *sequence, PLASMA_request *request,
677  PLASMA_bool check_info, int iinfo);
678 void QUARK_CORE_sgetrf_incpiv(Quark *quark, Quark_Task_Flags *task_flags,
679  int m, int n, int ib, int nb,
680  float *A, int lda,
681  int *IPIV,
682  PLASMA_sequence *sequence, PLASMA_request *request,
683  PLASMA_bool check_info, int iinfo);
684 void QUARK_CORE_sgetrf_nopiv(Quark *quark, Quark_Task_Flags *task_flags,
685  int m, int n, int ib, int nb,
686  float *A, int lda,
687  PLASMA_sequence *sequence, PLASMA_request *request,
688  int iinfo);
/* reclap / rectil: take the CORE_sgetrf_data_t handle and a trailing `nbthread`. */
689 void QUARK_CORE_sgetrf_reclap(Quark *quark, Quark_Task_Flags *task_flags,
690  CORE_sgetrf_data_t *data, int m, int n, int nb,
691  float *A, int lda,
692  int *IPIV,
693  PLASMA_sequence *sequence, PLASMA_request *request,
694  PLASMA_bool check_info, int iinfo,
695  int nbthread);
696 void QUARK_CORE_sgetrf_rectil(Quark *quark, Quark_Task_Flags *task_flags,
697  CORE_sgetrf_data_t *data,
698  PLASMA_desc A, float *Amn, int size,
699  int *IPIV,
700  PLASMA_sequence *sequence, PLASMA_request *request,
701  PLASMA_bool check_info, int iinfo,
702  int nbthread);
/* sgetrip: takes a size (szeA) where CORE_sgetrip takes a work buffer; _f1 / _f2 add one / two (fake, szeF, paramF) triples. */
703 void QUARK_CORE_sgetrip(Quark *quark, Quark_Task_Flags *task_flags,
704  int m, int n, float *A, int szeA);
705 void QUARK_CORE_sgetrip_f1(Quark *quark, Quark_Task_Flags *task_flags,
706  int m, int n, float *A, int szeA,
707  float *fake, int szeF, int paramF);
708 void QUARK_CORE_sgetrip_f2(Quark *quark, Quark_Task_Flags *task_flags,
709  int m, int n, float *A, int szeA,
710  float *fake1, int szeF1, int paramF1,
711  float *fake2, int szeF2, int paramF2);
/*
 * QUARK_CORE_ssymm, ssygst, ssyrk, ssyr2k, ssyrfb, shessq_f1, slacpy,
 * slacpy_f1, slacpy_pivot, slange and slange_f1. All return void and start
 * with (quark, task_flags).
 */
/* ssymm / ssyrk / ssyr2k: the CORE_ arguments with an `nb` inserted after the dimensions. */
712 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
713  PLASMA_enum side, PLASMA_enum uplo,
714  int m, int n, int nb,
715  float alpha, const float *A, int lda,
716  const float *B, int ldb,
717  float beta, float *C, int ldc);
/* ssygst: the `int *INFO` of CORE_ssygst is replaced by (sequence, request, iinfo). */
718 void QUARK_CORE_ssygst(Quark *quark, Quark_Task_Flags *task_flags,
719  int itype, PLASMA_enum uplo, int N,
720  float *A, int LDA,
721  float *B, int LDB,
722  PLASMA_sequence *sequence, PLASMA_request *request,
723  int iinfo);
724 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
725  PLASMA_enum uplo, PLASMA_enum trans,
726  int n, int k, int nb,
727  float alpha, const float *A, int lda,
728  float beta, float *C, int ldc);
729 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
730  PLASMA_enum uplo, PLASMA_enum trans,
731  int n, int k, int nb,
732  float alpha, const float *A, int lda,
733  const float *B, int LDB,
734  float beta, float *C, int ldc);
/* ssyrfb: no WORK / LDWORK arguments, unlike CORE_ssyrfb. */
735 void QUARK_CORE_ssyrfb(Quark *quark, Quark_Task_Flags *task_flags,
736  PLASMA_enum uplo,
737  int n, int k, int ib, int nb,
738  const float *A, int lda,
739  const float *T, int ldt,
740  float *C, int ldc);
/*
 * shessq_f1 is declared unconditionally here, while the matching CORE_shessq
 * prototype earlier in this header is guarded by `#ifdef COMPLEX`.
 */
741 void QUARK_CORE_shessq_f1( Quark *quark, Quark_Task_Flags *task_flags,
742  PLASMA_enum uplo, int n, const float *A, int lda,
743  float *scale, float *sumsq,
744  float *fake, int szeF, int paramF );
/* slacpy names its extra size argument `mb`; slacpy_f1 names it `nb`. */
745 void QUARK_CORE_slacpy(Quark *quark, Quark_Task_Flags *task_flags,
746  PLASMA_enum uplo, int m, int n, int mb,
747  const float *A, int lda,
748  float *B, int ldb);
749 void QUARK_CORE_slacpy_f1(Quark *quark, Quark_Task_Flags *task_flags,
750  PLASMA_enum uplo, int m, int n, int nb,
751  const float *A, int lda,
752  float *B, int ldb,
753  float *fake1, int szefake1, int flag1);
/* slacpy_pivot: CORE_slacpy_pivot's arguments plus a `pos` before `init`. */
754 void QUARK_CORE_slacpy_pivot(Quark *quark, Quark_Task_Flags *task_flags,
755  const PLASMA_desc descA,
756  PLASMA_enum direct,
757  int k1, int k2, const int *ipiv,
758  int *rankin, int *rankout,
759  float *A, int lda,
760  int pos, int init);
/* slange / slange_f1: take sizes (szeA, szeW) and a `result` pointer instead of work / normA. */
761 void QUARK_CORE_slange(Quark *quark, Quark_Task_Flags *task_flags,
762  int norm, int M, int N,
763  const float *A, int LDA, int szeA,
764  int szeW, float *result);
765 void QUARK_CORE_slange_f1(Quark *quark, Quark_Task_Flags *task_flags,
766  int norm, int M, int N,
767  const float *A, int LDA, int szeA,
768  int szeW, float *result,
769  float *fake, int szeF);
/*
 * QUARK_CORE_slansy and QUARK_CORE_slansy_f1 are each declared twice: once
 * under `#ifdef COMPLEX` and once unconditionally. The guarded and unguarded
 * prototypes are token-for-token the same, so the guard has no effect on
 * what callers see. The _f1 variant adds a (fake, szeF) pair.
 */
770 #ifdef COMPLEX
771 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
772  int norm, PLASMA_enum uplo, int N,
773  const float *A, int LDA, int szeA,
774  int szeW, float *result);
775 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
776  int norm, PLASMA_enum uplo, int N,
777  const float *A, int LDA, int szeA,
778  int szeW, float *result,
779  float *fake, int szeF);
780 #endif
781 void QUARK_CORE_slansy(Quark *quark, Quark_Task_Flags *task_flags,
782  int norm, PLASMA_enum uplo, int N,
783  const float *A, int LDA, int szeA,
784  int szeW, float *result);
785 void QUARK_CORE_slansy_f1(Quark *quark, Quark_Task_Flags *task_flags,
786  int norm, PLASMA_enum uplo, int N,
787  const float *A, int LDA, int szeA,
788  int szeW, float *result,
789  float *fake, int szeF);
/*
 * QUARK_CORE_slantr, slascal, slaset, slaset2, the slaswp family, slatro and
 * slauum. All return void and start with (quark, task_flags).
 */
/* slantr / slantr_f1: sizes (szeA, szeW) and a `result` pointer replace work / normA. */
790 void QUARK_CORE_slantr(Quark *quark, Quark_Task_Flags *task_flags,
791  PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N,
792  const float *A, int LDA, int szeA,
793  int szeW, float *result);
794 void QUARK_CORE_slantr_f1(Quark *quark, Quark_Task_Flags *task_flags,
795  PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N,
796  const float *A, int LDA, int szeA,
797  int szeW, float *result,
798  float *fake, int szeF);
799 void QUARK_CORE_slascal(Quark *quark, Quark_Task_Flags *task_flags,
800  PLASMA_enum uplo, int m, int n, int nb,
801  float alpha, float *A, int lda);
802 void QUARK_CORE_slaset(Quark *quark, Quark_Task_Flags *task_flags,
803  PLASMA_enum uplo, int n1, int n2, float alpha,
804  float beta, float *tileA, int ldtilea);
805 void QUARK_CORE_slaset2(Quark *quark, Quark_Task_Flags *task_flags,
806  PLASMA_enum uplo, int n1, int n2, float alpha,
807  float *tileA, int ldtilea);
/*
 * slaswp wrappers: the *_ontile variants take both the descriptor (by value)
 * and a float pointer A, plus either one `fakepanel` pointer or, for _f2, two
 * (fake, szefake, flag) triples.
 */
808 void QUARK_CORE_slaswp(Quark *quark, Quark_Task_Flags *task_flags,
809  int n, float *A, int lda,
810  int i1, int i2, const int *ipiv, int inc);
811 void QUARK_CORE_slaswp_f2(Quark *quark, Quark_Task_Flags *task_flags,
812  int n, float *A, int lda,
813  int i1, int i2, const int *ipiv, int inc,
814  float *fake1, int szefake1, int flag1,
815  float *fake2, int szefake2, int flag2);
816 void QUARK_CORE_slaswp_ontile(Quark *quark, Quark_Task_Flags *task_flags,
817  PLASMA_desc descA, float *A,
818  int i1, int i2, const int *ipiv, int inc, float *fakepanel);
819 void QUARK_CORE_slaswp_ontile_f2(Quark *quark, Quark_Task_Flags *task_flags,
820  PLASMA_desc descA, float *A,
821  int i1, int i2, const int *ipiv, int inc,
822  float *fake1, int szefake1, int flag1,
823  float *fake2, int szefake2, int flag2);
824 void QUARK_CORE_slaswpc_ontile(Quark *quark, Quark_Task_Flags *task_flags,
825  PLASMA_desc descA, float *A,
826  int i1, int i2, const int *ipiv, int inc, float *fakepanel);
/* slatro / slatro_f1: CORE_slatro's arguments plus `mb`; _f1 adds one (fake, szefake, flag) triple. */
827 void QUARK_CORE_slatro(Quark *quark, Quark_Task_Flags *task_flags,
828  PLASMA_enum uplo, PLASMA_enum trans, int m, int n, int mb,
829  const float *A, int lda,
830  float *B, int ldb);
831 void QUARK_CORE_slatro_f1(Quark *quark, Quark_Task_Flags *task_flags,
832  PLASMA_enum uplo, PLASMA_enum trans, int m, int n, int mb,
833  const float *A, int lda,
834  float *B, int ldb,
835  float *fake1, int szefake1, int flag1);
836 void QUARK_CORE_slauum(Quark *quark, Quark_Task_Flags *task_flags,
837  PLASMA_enum uplo, int n, int nb,
838  float *A, int lda);
839 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
840  float bump, int m, int n, float *A, int lda,
841  int bigM, int m0, int n0, unsigned long long int seed );
842 void QUARK_CORE_splgsy(Quark *quark, Quark_Task_Flags *task_flags,
843  float bump, int m, int n, float *A, int lda,
844  int bigM, int m0, int n0, unsigned long long int seed );
/*
 * QUARK_CORE_splrnt and the QUARK_CORE_spltmg* wrappers. All return void
 * (the CORE_spltmg* counterparts that return int lose their return value
 * here) and start with (quark, task_flags); the remaining arguments mirror
 * the CORE_ prototypes.
 */
845 void QUARK_CORE_splrnt(Quark *quark, Quark_Task_Flags *task_flags,
846  int m, int n, float *A, int lda,
847  int bigM, int m0, int n0, unsigned long long int seed );
848 void QUARK_CORE_spltmg(Quark *quark, Quark_Task_Flags *task_flags,
849  PLASMA_enum mtxtype, int m, int n, float *A, int lda,
850  int gM, int gN, int m0, int n0, unsigned long long int seed );
851 void QUARK_CORE_spltmg_chebvand( Quark *quark, Quark_Task_Flags *task_flags,
852  int M, int N, float *A, int LDA,
853  int gN, int m0, int n0,
854  float *W );
/* circul: the const vector is named W here but V in CORE_spltmg_circul (naming only). */
855 void QUARK_CORE_spltmg_circul( Quark *quark, Quark_Task_Flags *task_flags,
856  int M, int N, float *A, int LDA,
857  int gM, int m0, int n0,
858  const float *W );
859 void QUARK_CORE_spltmg_fiedler(Quark *quark, Quark_Task_Flags *task_flags,
860  int m, int n,
861  const float *X, int incX,
862  const float *Y, int incY,
863  float *A, int lda);
864 void QUARK_CORE_spltmg_hankel( Quark *quark, Quark_Task_Flags *task_flags,
865  PLASMA_enum uplo, int M, int N, float *A, int LDA,
866  int m0, int n0, int nb,
867  const float *V1,
868  const float *V2);
869 void QUARK_CORE_spltmg_toeppd1(Quark *quark, Quark_Task_Flags *task_flags,
870  int gM, int m0, int M,
871  float *W,
872  unsigned long long int seed);
873 void QUARK_CORE_spltmg_toeppd2(Quark *quark, Quark_Task_Flags *task_flags,
874  int M, int N, int K, int m0, int n0,
875  const float *W,
876  float *A, int LDA );
/*
 * Wrapper prototype for the spotrf kernel.  The CORE_spotrf signature listed
 * in this file's cross-reference section is (uplo, N, A, LDA, int *INFO);
 * this wrapper has no INFO pointer and instead takes nb, a PLASMA_sequence,
 * a PLASMA_request and an integer iinfo.
 * NOTE(review): presumably errors are reported through sequence/request,
 * with iinfo as an offset -- confirm in the definition.
 */
877 void QUARK_CORE_spotrf(Quark *quark, Quark_Task_Flags *task_flags,
878  PLASMA_enum uplo, int n, int nb,
879  float *A, int lda,
880  PLASMA_sequence *sequence, PLASMA_request *request,
881  int iinfo);
/* Wrapper prototype for ssetvar.  CORE_ssetvar is listed in this file's
 * cross-reference section as (alpha, x); the wrapper adds a third pointer,
 * Alock.
 * NOTE(review): presumably used only for dependency tracking -- confirm. */
882 void QUARK_CORE_ssetvar(Quark *quark, Quark_Task_Flags *task_flags,
883  const float *alpha, float *x,
884  float *Alock);
/* Wrapper prototype for sshift: integers s, m, n, L and a writable A. */
885 void QUARK_CORE_sshift( Quark *quark, Quark_Task_Flags *task_flags,
886  int s, int m, int n, int L,
887  float *A);
/* Wrapper prototype for sshiftw.  Parameters after quark/task_flags match the
 * CORE_sshiftw signature in the cross-reference section
 * (s, cl, m, n, L, A, W). */
888 void QUARK_CORE_sshiftw(Quark *quark, Quark_Task_Flags *task_flags,
889  int s, int cl, int m, int n, int L,
890  float *A, float *W);
/*
 * Wrapper prototype for the sssssm kernel.  A1 and A2 are writable; L1, L2
 * and IPIV are read-only.  Each matrix pointer is followed by its leading
 * dimension argument (lda1, lda2, ldl1, ldl2).
 */
891 void QUARK_CORE_sssssm(Quark *quark, Quark_Task_Flags *task_flags,
892  int m1, int n1, int m2, int n2, int k, int ib, int nb,
893  float *A1, int lda1,
894  float *A2, int lda2,
895  const float *L1, int ldl1,
896  const float *L2, int ldl2,
897  const int *IPIV);
/*
 * Wrapper prototype for sstedc.  The CORE_sstedc signature listed in this
 * file's cross-reference section additionally takes WORK, LWORK, IWORK and
 * LIWORK; none of those appear here.
 * NOTE(review): presumably the wrapper arranges workspace itself -- confirm.
 */
898 void QUARK_CORE_sstedc(Quark *quark, Quark_Task_Flags *task_flags,
899  PLASMA_enum compz, int n,
900  float *D, float *E,
901  float *Z, int ldz);
/* Same parameter list plus two untyped (void *, size, flag) triples. */
902 void QUARK_CORE_sstedc_f2(Quark *quark, Quark_Task_Flags *task_flags,
903  PLASMA_enum compz, int n,
904  float *D, float *E,
905  float *Z, int ldz,
906  void *fake1, int szefake1, int flag1,
907  void *fake2, int szefake2, int flag2);
/* Wrapper prototype for ssteqr; same parameter list as QUARK_CORE_sstedc. */
908 void QUARK_CORE_ssteqr(Quark *quark, Quark_Task_Flags *task_flags,
909  PLASMA_enum compz, int n,
910  float *D, float *E,
911  float *Z, int ldz);
/* Wrapper prototype for ssymm: A and B are read-only, C is writable; takes
 * scalars alpha and beta by value and an extra integer nb. */
912 void QUARK_CORE_ssymm(Quark *quark, Quark_Task_Flags *task_flags,
913  PLASMA_enum side, PLASMA_enum uplo,
914  int m, int n, int nb,
915  float alpha, const float *A, int lda,
916  const float *B, int ldb,
917  float beta, float *C, int ldc);
/* Wrapper prototype for ssyrk.  CORE_ssyrk is listed in this file's
 * cross-reference section as (uplo, trans, N, K, alpha, A, LDA, beta, C,
 * LDC); the wrapper adds nb after k. */
918 void QUARK_CORE_ssyrk(Quark *quark, Quark_Task_Flags *task_flags,
919  PLASMA_enum uplo, PLASMA_enum trans,
920  int n, int k, int nb,
921  float alpha, const float *A, int lda,
922  float beta, float *C, int ldc);
/* Wrapper prototype for ssyr2k.  Note the leading-dimension parameter of B is
 * spelled LDB (upper case) while the others are lower case; parameter names
 * in a prototype do not affect callers. */
923 void QUARK_CORE_ssyr2k(Quark *quark, Quark_Task_Flags *task_flags,
924  PLASMA_enum uplo, PLASMA_enum trans,
925  int n, int k, int nb,
926  float alpha, const float *A, int lda,
927  const float *B, int LDB,
928  float beta, float *C, int ldc);
/* Wrapper prototype for ssyssq (_f1 form): reads A, writes through scale and
 * sumsq, and takes one extra (pointer, size, param) triple named fake. */
929 void QUARK_CORE_ssyssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
930  PLASMA_enum uplo, int n, const float *A, int lda,
931  float *scale, float *sumsq,
932  float *fake, int szeF, int paramF );
/* Wrapper prototype for sswpab: integers i, n1, n2, a writable A and an
 * integer szeA.
 * NOTE(review): szeA is presumably the extent of A given to the scheduler --
 * confirm. */
933 void QUARK_CORE_sswpab(Quark *quark, Quark_Task_Flags *task_flags,
934  int i, int n1, int n2,
935  float *A, int szeA);
/* Wrapper prototype for sswptr_ontile.  CORE_sswptr_ontile is listed in this
 * file's cross-reference section as (descA, i1, i2, ipiv, inc, Akk, ldak);
 * the wrapper adds the tile pointer Aij after descA. */
936 void QUARK_CORE_sswptr_ontile(Quark *quark, Quark_Task_Flags *task_flags,
937  PLASMA_desc descA, float *Aij,
938  int i1, int i2, const int *ipiv, int inc,
939  const float *Akk, int ldak);
/* Wrapper prototype for stradd.  CORE_stradd is listed in this file's
 * cross-reference section as returning int with (uplo, trans, M, N, alpha, A,
 * LDA, beta, B, LDB); the wrapper returns void and adds nb after n. */
940 void QUARK_CORE_stradd(Quark *quark, Quark_Task_Flags *task_flags,
941  PLASMA_enum uplo, PLASMA_enum trans, int m, int n, int nb,
942  float alpha,
943  const float *A, int lda,
944  float beta,
945  float *B, int ldb);
/* Wrapper prototype for strasm.  CORE_strasm is listed as (storev, uplo, diag,
 * M, N, A, lda, work); the wrapper adds the integers szeA and szeW.
 * NOTE(review): presumably the extents of A and work -- confirm. */
946 void QUARK_CORE_strasm(Quark *quark, Quark_Task_Flags *task_flags,
947  PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int m, int n,
948  const float *A, int lda, int szeA,
949  float *work, int szeW);
/* Same parameter list plus a trailing (pointer, size) pair: fake, szeF. */
950 void QUARK_CORE_strasm_f1(Quark *quark, Quark_Task_Flags *task_flags,
951  PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int m, int n,
952  const float *A, int lda, int szeA,
953  float *work, int szeW,
954  float *fake, int szeF);
/*
 * Wrapper prototype for strdalg1.  Through grsiz the parameters match the
 * CORE_strdalg1 signature listed in this file's cross-reference section; the
 * kernel then ends with `float *work`, whereas this wrapper ends with three
 * int pointers PCOL, ACOL and MCOL.
 * NOTE(review): the role of PCOL/ACOL/MCOL is not visible here -- confirm in
 * the definition.
 */
955 void QUARK_CORE_strdalg1(Quark *quark, Quark_Task_Flags *task_flags,
956  int n,
957  int nb,
958  float *A,
959  int lda,
960  float *V,
961  float *TAU,
962  int Vblksiz, int wantz,
963  int i, int sweepid, int m, int grsiz,
964  int *PCOL, int *ACOL, int *MCOL);
/* Wrapper prototype for strmm.  CORE_strmm is listed in this file's
 * cross-reference section as (side, uplo, transA, diag, M, N, alpha, A, LDA,
 * B, LDB); the wrapper adds nb after n. */
965 void QUARK_CORE_strmm(Quark *quark, Quark_Task_Flags *task_flags,
966  PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
967  int m, int n, int nb,
968  float alpha, const float *A, int lda,
969  float *B, int ldb);
/* _p2 form: identical except that B is passed as float ** (pointer to the
 * matrix pointer). */
970 void QUARK_CORE_strmm_p2(Quark *quark, Quark_Task_Flags *task_flags,
971  PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
972  int m, int n, int nb,
973  float alpha, const float *A, int lda,
974  float **B, int ldb);
/* Wrapper prototype for strsm.  CORE_strsm is listed with the same parameters
 * as CORE_strmm; the wrapper again adds nb after n. */
975 void QUARK_CORE_strsm(Quark *quark, Quark_Task_Flags *task_flags,
976  PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag,
977  int m, int n, int nb,
978  float alpha, const float *A, int lda,
979  float *B, int ldb);
/* Wrapper prototype for strssq (_f1 form): reads A, writes through scale and
 * sumsq, and takes one extra (pointer, size, param) triple named fake. */
980 void QUARK_CORE_strssq_f1( Quark *quark, Quark_Task_Flags *task_flags,
981  PLASMA_enum uplo, PLASMA_enum diag,
982  int m, int n, const float *A, int lda,
983  float *scale, float *sumsq,
984  float *fake, int szeF, int paramF );
/* Wrapper prototype for strtri.  CORE_strtri is listed in this file's
 * cross-reference section as (uplo, diag, N, A, LDA, int *info); the wrapper
 * has no info pointer and instead takes nb, sequence, request and iinfo. */
985 void QUARK_CORE_strtri(Quark *quark, Quark_Task_Flags *task_flags,
986  PLASMA_enum uplo, PLASMA_enum diag, int n, int nb,
987  float *A, int lda,
988  PLASMA_sequence *sequence, PLASMA_request *request,
989  int iinfo);
/*
 * Wrapper prototypes for the stslqt / stsmlq kernels.  In this file's
 * cross-reference section the matching CORE_* kernels return int and take
 * trailing workspace arguments (TAU/WORK or WORK/LDWORK); the wrappers below
 * return void and take no workspace arguments.
 */
/* CORE_stslqt: (M, N, IB, A1, LDA1, A2, LDA2, T, LDT, TAU, WORK).
 * Wrapper adds nb after ib. */
990 void QUARK_CORE_stslqt(Quark *quark, Quark_Task_Flags *task_flags,
991  int m, int n, int ib, int nb,
992  float *A1, int lda1,
993  float *A2, int lda2,
994  float *T, int ldt);
/* CORE_stsmlq ends with (..., K, IB, A1, ..., T, LDT, WORK, LDWORK).
 * Wrapper adds nb after ib; V and T are read-only. */
995 void QUARK_CORE_stsmlq(Quark *quark, Quark_Task_Flags *task_flags,
996  PLASMA_enum side, PLASMA_enum trans,
997  int m1, int n1, int m2, int n2, int k, int ib, int nb,
998  float *A1, int lda1,
999  float *A2, int lda2,
1000  const float *V, int ldv,
1001  const float *T, int ldt);
/* _sytra1 variant: same parameter list as QUARK_CORE_stsmlq. */
1002 void QUARK_CORE_stsmlq_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
1003  PLASMA_enum side, PLASMA_enum trans,
1004  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1005  float *A1, int lda1,
1006  float *A2, int lda2,
1007  const float *V, int ldv,
1008  const float *T, int ldt);
/* _corner variant: no side/trans, three writable tiles A1, A2, A3 with sizes
 * (m1,n1), (m2,n2), (m3,n3).  CORE_stsmlq_corner already takes nb. */
1009 void QUARK_CORE_stsmlq_corner(Quark *quark, Quark_Task_Flags *task_flags,
1010  int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb,
1011  float *A1, int lda1,
1012  float *A2, int lda2,
1013  float *A3, int lda3,
1014  const float *V, int ldv,
1015  const float *T, int ldt);
/*
 * Wrapper prototypes for the stsmqr / stsqrt kernels.  In this file's
 * cross-reference section the matching CORE_* kernels return int and take
 * trailing workspace arguments (WORK/LDWORK or TAU/WORK); the wrappers below
 * return void and take no workspace arguments.
 */
/* CORE_stsmqr ends with (..., K, IB, A1, ..., T, LDT, WORK, LDWORK).
 * Wrapper adds nb after ib; V and T are read-only. */
1016 void QUARK_CORE_stsmqr(Quark *quark, Quark_Task_Flags *task_flags,
1017  PLASMA_enum side, PLASMA_enum trans,
1018  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1019  float *A1, int lda1,
1020  float *A2, int lda2,
1021  const float *V, int ldv,
1022  const float *T, int ldt);
/* _sytra1 variant: same parameter list as QUARK_CORE_stsmqr. */
1023 void QUARK_CORE_stsmqr_sytra1(Quark *quark, Quark_Task_Flags *task_flags,
1024  PLASMA_enum side, PLASMA_enum trans,
1025  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1026  float *A1, int lda1,
1027  float *A2, int lda2,
1028  const float *V, int ldv,
1029  const float *T, int ldt);
/* _corner variant: no side/trans, three writable tiles A1, A2, A3 with sizes
 * (m1,n1), (m2,n2), (m3,n3).  CORE_stsmqr_corner already takes nb. */
1030 void QUARK_CORE_stsmqr_corner(Quark *quark, Quark_Task_Flags *task_flags,
1031  int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb,
1032  float *A1, int lda1,
1033  float *A2, int lda2,
1034  float *A3, int lda3,
1035  const float *V, int ldv,
1036  const float *T, int ldt);
/* CORE_stsqrt: (M, N, IB, A1, LDA1, A2, LDA2, T, LDT, TAU, WORK).
 * Wrapper adds nb after ib. */
1037 void QUARK_CORE_stsqrt(Quark *quark, Quark_Task_Flags *task_flags,
1038  int m, int n, int ib, int nb,
1039  float *A1, int lda1,
1040  float *A2, int lda2,
1041  float *T, int ldt);
/*
 * Wrapper prototype for the ststrf kernel.  U, A and L are writable matrices
 * each followed by its leading dimension; IPIV is a writable int array.
 * Also takes a PLASMA_sequence, a PLASMA_request, a PLASMA_bool check_info
 * and an integer iinfo.
 * NOTE(review): presumably check_info gates whether a non-zero kernel status
 * is reported through sequence/request -- confirm in the definition.
 */
1042 void QUARK_CORE_ststrf(Quark *quark, Quark_Task_Flags *task_flags,
1043  int m, int n, int ib, int nb,
1044  float *U, int ldu,
1045  float *A, int lda,
1046  float *L, int ldl,
1047  int *IPIV,
1048  PLASMA_sequence *sequence, PLASMA_request *request,
1049  PLASMA_bool check_info, int iinfo);
/*
 * Wrapper prototypes for the stt* kernels.  Their parameter lists mirror the
 * sts* wrappers declared earlier in this header.  In this file's
 * cross-reference section the CORE_stt* kernels return int and end with
 * workspace arguments that the wrappers do not take; each wrapper adds nb
 * after ib.
 */
/* CORE_sttmqr ends with (..., T, LDT, WORK, LDWORK). */
1050 void QUARK_CORE_sttmqr(Quark *quark, Quark_Task_Flags *task_flags,
1051  PLASMA_enum side, PLASMA_enum trans,
1052  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1053  float *A1, int lda1,
1054  float *A2, int lda2,
1055  const float *V, int ldv,
1056  const float *T, int ldt);
/* CORE_sttqrt ends with (..., T, LDT, TAU, WORK). */
1057 void QUARK_CORE_sttqrt(Quark *quark, Quark_Task_Flags *task_flags,
1058  int m, int n, int ib, int nb,
1059  float *A1, int lda1,
1060  float *A2, int lda2,
1061  float *T, int ldt);
/* CORE_sttmlq ends with (..., T, LDT, WORK, LDWORK). */
1062 void QUARK_CORE_sttmlq(Quark *quark, Quark_Task_Flags *task_flags,
1063  PLASMA_enum side, PLASMA_enum trans,
1064  int m1, int n1, int m2, int n2, int k, int ib, int nb,
1065  float *A1, int lda1,
1066  float *A2, int lda2,
1067  const float *V, int ldv,
1068  const float *T, int ldt);
/* CORE_sttlqt ends with (..., T, LDT, TAU, WORK). */
1069 void QUARK_CORE_sttlqt(Quark *quark, Quark_Task_Flags *task_flags,
1070  int m, int n, int ib, int nb,
1071  float *A1, int lda1,
1072  float *A2, int lda2,
1073  float *T, int ldt);
/* Wrapper prototype for spamm.  Parameters after quark/task_flags match the
 * CORE_spamm signature listed in this file's cross-reference section; the
 * kernel returns int, the wrapper void.  A1 and V are read-only, A2 and W
 * are writable. */
1074 void QUARK_CORE_spamm(Quark *quark, Quark_Task_Flags *task_flags,
1075  int op, PLASMA_enum side, PLASMA_enum storev,
1076  int m, int n, int k, int l,
1077  const float *A1, int lda1,
1078  float *A2, int lda2,
1079  const float *V, int ldv,
1080  float *W, int ldw);
/* Wrapper prototype for splssq: integer m, read-only A, writable result. */
1081 void QUARK_CORE_splssq( Quark *quark, Quark_Task_Flags *task_flags,
1082  int m, const float *A, float *result );
/*
 * Wrapper prototypes for sormlq / sormqr.  A and T are read-only, C is
 * writable.  The CORE_* kernels listed in this file's cross-reference section
 * return int and end with WORK, LDWORK, which the wrappers do not take.
 *
 * Mind the integer order, which differs between the two declarations:
 *   sormlq: m, n, ib, nb, k
 *   sormqr: m, n, k, ib, nb
 */
1083 void QUARK_CORE_sormlq(Quark *quark, Quark_Task_Flags *task_flags,
1084  PLASMA_enum side, PLASMA_enum trans,
1085  int m, int n, int ib, int nb, int k,
1086  const float *A, int lda,
1087  const float *T, int ldt,
1088  float *C, int ldc);
1089 void QUARK_CORE_sormqr(Quark *quark, Quark_Task_Flags *task_flags,
1090  PLASMA_enum side, PLASMA_enum trans,
1091  int m, int n, int k, int ib, int nb,
1092  const float *A, int lda,
1093  const float *T, int ldt,
1094  float *C, int ldc);
1095 
1096 
/* Wrapper prototype for slascl.  Parameters after quark/task_flags match the
 * CORE_slascl signature listed in this file's cross-reference section; the
 * kernel returns int, the wrapper void. */
1097 void QUARK_CORE_slascl(Quark *quark, Quark_Task_Flags *task_flags,
1098  PLASMA_enum type, int kl, int ku, float cfrom, float cto,
1099  int m, int n, float *A, int lda);
/* _p2f1 form: cfrom and cto are passed by pointer instead of by value, and
 * one untyped (void *, size, flag) triple is appended.
 * NOTE(review): presumably the pointers are read when the task runs rather
 * than when it is queued -- confirm in the definition. */
1100 void QUARK_CORE_slascl_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1101  PLASMA_enum type, int kl, int ku, float *cfrom, float *cto,
1102  int m, int n, float *A, int lda,
1103  void *fake, int szefake, int flag);
/* Wrapper prototype for slaed0_lascl: n plus writable scale, D and E. */
1104 void QUARK_CORE_slaed0_lascl( Quark *quark, Quark_Task_Flags *task_flags,
1105  int n, float *scale, float *D, float *E);
/* Wrapper prototype for slaed0_betaapprox.  Parameters after
 * quark/task_flags match CORE_slaed0_betaapprox
 * (subpbs, subpbs_info, D, E); D is writable, E read-only. */
1106 void QUARK_CORE_slaed0_betaapprox(Quark *quark, Quark_Task_Flags *task_flags,
1107  int subpbs, const int *subpbs_info,
1108  float *D, const float *E);
1109 
1110 #ifndef COMPLEX
/*
 * Wrapper prototype for slaed2_computeK (compiled only when COMPLEX is not
 * defined).  From K1 through COLTYP the parameters line up with the
 * CORE_slaed2_computeK signature listed in this file's cross-reference
 * section (whose first parameter is `int *K`); the wrapper then adds
 * Qmerge (float **), wsmode and a second int pointer K2.
 * NOTE(review): the relationship between K1 and K2 is not visible here --
 * confirm in the definition.
 */
1111 void QUARK_CORE_slaed2_computeK(Quark *quark, Quark_Task_Flags *task_flags,
1112  int *K1, int n, int n1,
1113  float *beta, float *D, float *Q, int LDQ,
1114  float *Z, float *DLAMBDA, float *W,
1115  int *INDX, int *INDXC, int *INDXP, int *INDXQ,
1116  int *COLTYP,
1117  float **Qmerge, int wsmode,
1118  int *K2);
1119 
/* Wrapper prototype for slaed1_pipelined.  K, INDX, ctot, beta, DLAMBDA and
 * W are read-only; D, Q, Q2 and Wred are writable; start/end are integers.
 * NOTE(review): start/end presumably delimit the slice handled by one task
 * -- confirm. */
1120 void QUARK_CORE_slaed1_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1121  int n, int n1, const int *K,
1122  const int *INDX, const int *ctot,
1123  float *D, const float *beta,
1124  float *Q, int LDQ, float *Q2,
1125  const float *DLAMBDA, const float *W, float *Wred,
1126  int start, int end);
/* Wrapper prototype for slaed2_compressq.  CORE_slaed2_compressq is listed in
 * this file's cross-reference section as (n, n1, INDX, ctot, Q, LDQ, Q2,
 * start, end); the wrapper places start/end right after n1 and appends a
 * writable int pointer K. */
1127 void QUARK_CORE_slaed2_compressq(Quark *quark, Quark_Task_Flags *task_flags,
1128  int n, int n1, int start, int end,
1129  const int *INDX, const int *ctot,
1130  const float *Q, int LDQ,
1131  float *Q2, int *K);
/* Wrapper prototype for slaed4 (_p2f1 form).  CORE_slaed4 is listed as taking
 * K, beta, Q and LDQ directly (int, float, float *, int); here K, beta and
 * LDQ are pointers and Q is float **.  Adds sequence, request and an untyped
 * (fakeQ, flagfQ) pair. */
1132 void QUARK_CORE_slaed4_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1133  int n, const int *K,
1134  float *D, const float *beta,
1135  float **Q, const int *LDQ,
1136  const float *DLAMBDA, const float *W, const int *INDX,
1137  int start, int end,
1138  PLASMA_sequence *sequence, PLASMA_request *request,
1139  void *fakeQ, int flagfQ);
/* Wrapper prototype for slaed3 compW (_p2f1 form).  CORE_slaed3_computeW is
 * listed as (n, K, Q, LDQ, DLAMBDA, W, INDX, start, end) with K and LDQ by
 * value; here K and LDQ are pointers, Q is float **, and two untyped
 * (pointer, flag) pairs are appended. */
1140 void QUARK_CORE_slaed3_compW_p2f1(Quark *quark, Quark_Task_Flags *task_flags,
1141  int n, const int *K,
1142  float **Q, const int *LDQ,
1143  const float *DLAMBDA, float *W,
1144  const int *INDX,
1145  int start, int end,
1146  void *fakeQ, int flagfQ,
1147  void *fakeW, int flagfW);
1148 
/* Wrapper prototype for slaed3_reduceW.  CORE_slaed3_reduceW is listed in
 * this file's cross-reference section as (n, n1, K, l, Q, LDQ, Wred, W) with
 * K by value; the wrapper takes K as `const int *`. */
1149 void QUARK_CORE_slaed3_reduceW(Quark *quark, Quark_Task_Flags *task_flags,
1150  int n, int n1, const int *K, int l,
1151  const float *Q, int LDQ,
1152  const float *Wred, float *W);
/* _p2 form: Q is float ** and LDQ is `const int *`. */
1153 void QUARK_CORE_slaed3_reduceW_p2(Quark *quark, Quark_Task_Flags *task_flags,
1154  int n, int n1, const int *K, int l,
1155  float **Q, const int *LDQ,
1156  const float *Wred, float *W);
1157 
/* Wrapper prototype for slaed2_copydef.  CORE_slaed2_copydef is listed as
 * (n, n1, K, ctot, Q, LDQ, Q2, start, end) with K by value; the wrapper takes
 * K as `const int *`.  Q is writable, Q2 read-only. */
1158 void QUARK_CORE_slaed2_copydef(Quark *quark, Quark_Task_Flags *task_flags,
1159  int n, int n1, const int *K, const int *ctot,
1160  float *Q, int LDQ, const float *Q2,
1161  int start, int end);
/* Wrapper prototype for slaed3_computevectors.  K, il_nondef, iu_nondef and
 * INDXC are read-only int pointers; Q and W are writable; WSglobal and
 * WSlocal are float **.
 * NOTE(review): presumably two alternative workspaces selected by wsmode --
 * confirm in the definition. */
1162 void QUARK_CORE_slaed3_computevectors(Quark *quark, Quark_Task_Flags *task_flags,
1163  int wsmode, int n, const int *K,
1164  const int *il_nondef, const int *iu_nondef,
1165  float *Q, int LDQ, float *W, const int *INDXC,
1166  float **WSglobal, float **WSlocal,
1167  int start, int end );
/* Wrapper prototype for slaed3_wscopy: reads Q, takes WORK as float **. */
1168 void QUARK_CORE_slaed3_wscopy( Quark *quark, Quark_Task_Flags *task_flags,
1169  const int *K, const int *il_nondef, const int *iu_nondef,
1170  const float *Q, int LDQ, float **WORK,
1171  int start, int end );
/* Wrapper prototype for slaed3_updatevectors.  CORE_slaed3_updatevectors is
 * listed in this file's cross-reference section with K, il_nondef and
 * iu_nondef by value, a `const int *ctot` and `float *WORK`; the wrapper takes
 * those three integers by pointer, has D, INDXQ and COLTYP instead of ctot,
 * takes WORK as float ** and appends WORKDEP. */
1172 void QUARK_CORE_slaed3_updatevectors(Quark *quark, Quark_Task_Flags *task_flags,
1173  int oper, int wsmode, int n, int n1, int *K,
1174  int *il_nondef, int *iu_nondef,
1175  float *D, float *Q, int LDQ, float *Q2,
1176  int *INDXQ, int *COLTYP, float **WORK,
1177  int start, int end, float **WORKDEP);
/* Wrapper prototype for slaed3_pipelined; the last integer is named end2. */
1178 void QUARK_CORE_slaed3_pipelined(Quark *quark, Quark_Task_Flags *task_flags,
1179  int n, int n1, int *K, int *il_nondef, int *iu_nondef,
1180  float *D, float *Q, int LDQ, float *Q2,
1181  int *INDXC, int *INDXQ, int *COLTYP, float *W,
1182  int start, int end2);
1183 
/* Wrapper prototype for sDC_fakedep: nb_tasks, nb, Q (LDQ) and W.
 * NOTE(review): the name suggests it exists only to create task dependencies
 * -- confirm in the definition. */
1184 void QUARK_CORE_sDC_fakedep(Quark *quark, Quark_Task_Flags *task_flags,
1185  int nb_tasks, int nb, float *Q, int LDQ, float *W);
1186 #endif
1187 
/* Wrapper prototype for sswap.  CORE_sswap is listed in this file's
 * cross-reference section as (m, n, Q, ldq, const work, const perm, start,
 * end); the wrapper takes work and perm without const and names the range
 * begin/end. */
1188 void QUARK_CORE_sswap(Quark *quark, Quark_Task_Flags *task_flags,
1189  int m, int n, float *Q,
1190  int LDQ, float *work,
1191  int *perm, int begin, int end);
/* Only visible when the including translation unit defines COMPLEX; the top
 * of this header defines REAL, not COMPLEX.
 * NOTE(review): CORE_slag2c is listed in the cross-reference section with
 * `PLASMA_Complex32_t *Z`, while this prototype declares `float *Z` --
 * looks like a precision-generation artifact; confirm before enabling. */
1192 #ifdef COMPLEX
1193 void QUARK_CORE_slag2c(Quark *quark, Quark_Task_Flags *task_flags,
1194  int m, int n,
1195  const float *Q, int LDQ,
1196  float *Z, int LDZ);
1197 #endif
/* Wrapper prototype for slaed3_freebigwork: K_bis, largework and WORK
 * (float **).
 * NOTE(review): presumably releases *WORK -- confirm in the definition. */
1198 void QUARK_CORE_slaed3_freebigwork(Quark *quark, Quark_Task_Flags *task_flags,
1199  int *K_bis, int largework, float **WORK);
/* Wrapper prototype for slaset_identity: n, start, size and a writable A. */
1200 void QUARK_CORE_slaset_identity(Quark *quark, Quark_Task_Flags *task_flags,
1201  int n, int start, int size,
1202  float *A);
1203 
/*
 * CORE_*_quark entry points (prototypes only).  Each takes a single Quark
 * handle and returns void.
 * NOTE(review): presumably each one unpacks its arguments from the running
 * task and calls the CORE_* kernel of the same name -- confirm in the
 * corresponding core_*.c file.
 */
1207 void CORE_sasum_quark(Quark *quark);
1208 void CORE_sasum_f1_quark(Quark *quark);
1209 void CORE_sgeadd_quark(Quark *quark);
1210 void CORE_sbrdalg1_quark(Quark *quark);
1211 void CORE_sgelqt_quark(Quark *quark);
1212 void CORE_sgemm_quark(Quark *quark);
1213 void CORE_sgemm_tile_quark(Quark *quark);
1214 void CORE_sgemv_quark(Quark *quark);
1215 void CORE_sgemv_tile_quark(Quark *quark);
1216 void CORE_sgeqp3_init_quark(Quark *quark);
1217 void CORE_sgeqp3_larfg_quark(Quark *quark);
1218 void CORE_sgeqp3_norms_quark(Quark *quark);
1219 void CORE_sgeqp3_pivot_quark(Quark *quark);
1220 void CORE_sgeqp3_tntpiv_quark(Quark *quark);
1221 void CORE_sgeqp3_update_quark(Quark *quark);
1222 void CORE_sgeqrt_quark(Quark *quark);
1223 void CORE_sgessm_quark(Quark *quark);
1224 void CORE_sgessq_quark(Quark *quark);
1225 void CORE_sgessq_f1_quark(Quark *quark);
1226 void CORE_sgetrf_quark(Quark *quark);
1227 void CORE_sgetrf_incpiv_quark(Quark *quark);
1228 void CORE_sgetrf_nopiv_quark(Quark* quark);
1229 void CORE_sgetrf_reclap_quark(Quark *quark);
1230 void CORE_sgetrf_rectil_quark(Quark* quark);
1231 void CORE_sgetrip_quark(Quark *quark);
1232 void CORE_sgetrip_f1_quark(Quark *quark);
1233 void CORE_sgetrip_f2_quark(Quark *quark);
/*
 * CORE_*_quark entry points, ssygst .. ssyr2k (prototypes only).  Each takes
 * a single Quark handle and returns void.
 *
 * Every name in this range is declared exactly once and unconditionally.
 * CORE_ssymm_quark, CORE_ssyrk_quark, CORE_ssyr2k_quark, CORE_slansy_quark
 * and CORE_slansy_f1_quark need no `#ifdef COMPLEX` copies: an unconditional
 * prototype already covers both configurations, so a conditional duplicate
 * can never add a declaration.  Likewise CORE_slatro_quark and
 * CORE_splgsy_quark appear once; repeated identical prototypes are legal C
 * but are reported by -Wredundant-decls.
 * NOTE(review): the duplicates look like precision-generation artifacts
 * (distinct complex names mapping to one real name) -- confirm against the
 * generator template.
 */
1239 void CORE_ssygst_quark(Quark *quark);
1240 void CORE_ssyrfb_quark(Quark *quark);
1241 void CORE_shessq_quark(Quark *quark);
1242 void CORE_shessq_f1_quark(Quark *quark);
1243 void CORE_slacpy_quark(Quark *quark);
1244 void CORE_slacpy_f1_quark(Quark *quark);
1245 void CORE_slacpy_pivot_quark(Quark *quark);
1246 void CORE_slatro_quark(Quark *quark);
1247 void CORE_slatro_f1_quark(Quark *quark);
1248 void CORE_slange_quark(Quark *quark);
1249 void CORE_slange_f1_quark(Quark *quark);
1254 void CORE_slansy_quark(Quark *quark);
1255 void CORE_slansy_f1_quark(Quark *quark);
1256 void CORE_slaset_quark(Quark *quark);
1257 void CORE_slaset2_quark(Quark *quark);
1259 void CORE_slauum_quark(Quark *quark);
1260 void CORE_spamm_quark(Quark *quark);
1261 void CORE_splgsy_quark(Quark *quark);
1263 void CORE_splrnt_quark(Quark *quark);
1264 void CORE_spltmg_quark(Quark *quark);
1265 void CORE_splssq_quark(Quark *quark);
1266 void CORE_spotrf_quark(Quark *quark);
1267 void CORE_ssetvar_quark(Quark *quark);
1268 void CORE_sshift_quark(Quark *quark);
1269 void CORE_sshiftw_quark(Quark *quark);
1270 void CORE_sssssm_quark(Quark *quark);
1271 void CORE_ssymm_quark(Quark *quark);
1272 void CORE_ssyrk_quark(Quark *quark);
1273 void CORE_ssyr2k_quark(Quark *quark);
/*
 * CORE_*_quark entry points, ssyssq .. sgemm_p3 (prototypes only).  Each
 * takes a single Quark handle and returns void.
 * NOTE(review): presumably each one unpacks its arguments from the running
 * task and calls the CORE_* kernel of the same name -- confirm in the
 * corresponding core_*.c file.
 */
1274 void CORE_ssyssq_quark(Quark *quark);
1275 void CORE_ssyssq_f1_quark(Quark *quark);
1276 void CORE_sswpab_quark(Quark *quark);
1277 void CORE_sswptr_ontile_quark(Quark *quark);
1278 void CORE_strdalg1_quark(Quark *quark);
1279 void CORE_strmm_quark(Quark *quark);
1280 void CORE_strsm_quark(Quark *quark);
1281 void CORE_strtri_quark(Quark *quark);
1282 void CORE_stslqt_quark(Quark *quark);
1283 void CORE_stsmlq_quark(Quark *quark);
1284 void CORE_stsmlq_sytra1_quark(Quark *quark);
1285 void CORE_stsmlq_corner_quark(Quark *quark);
1286 void CORE_stsmqr_quark(Quark *quark);
1287 void CORE_stsmqr_sytra1_quark(Quark *quark);
1288 void CORE_stsmqr_corner_quark(Quark *quark);
1289 void CORE_stsqrt_quark(Quark *quark);
1290 void CORE_ststrf_quark(Quark *quark);
1291 void CORE_sttmqr_quark(Quark *quark);
1292 void CORE_sttqrt_quark(Quark *quark);
1293 void CORE_sttmlq_quark(Quark *quark);
1294 void CORE_sttlqt_quark(Quark *quark);
1295 void CORE_sormlq_quark(Quark *quark);
1296 void CORE_sormqr_quark(Quark *quark);
1297 void CORE_slaswp_quark(Quark* quark);
1298 void CORE_slaswp_f2_quark(Quark* quark);
1299 void CORE_slaswp_ontile_quark(Quark *quark);
1300 void CORE_slaswp_ontile_f2_quark(Quark *quark);
1301 void CORE_slaswpc_ontile_quark(Quark *quark);
1302 void CORE_strmm_p2_quark(Quark* quark);
1303 void CORE_sgemm_f2_quark(Quark* quark);
1304 void CORE_sgemm_p2_quark(Quark* quark);
1305 void CORE_sgemm_p3_quark(Quark* quark);
1306 void CORE_sgemm_p3_quark(Quark* quark);
1307 
1308 #endif /* defined(QUARK_H) */
1309 
1310 #ifdef __cplusplus
1311 }
1312 #endif
1313 
/* NOTE(review): the top of this header does `#define REAL`, yet the macro
 * removed here is COMPLEX.  As written, REAL stays defined for whatever is
 * included after this header, and a COMPLEX defined by the includer is
 * silently undefined.  Presumably `#undef REAL` was intended (precision
 * generation artifact) -- confirm that no includer relies on the current
 * behaviour before changing it. */
1314 #undef COMPLEX
1315 
1316 #endif
void CORE_slaed0_betaapprox(int subpbs, const int *subpbs_info, float *D, const float *E)
Definition: core_slaed0_betaapprox.c:49
int CORE_sttqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttqrt.c:116
int CORE_stsmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmlq.c:124
int CORE_sgetf2_nopiv(int m, int n, float *A, int lda)
Definition: core_sgetf2_nopiv.c:64
void CORE_spotrf(PLASMA_enum uplo, int N, float *A, int LDA, int *INFO)
Definition: core_spotrf.c:68
int CORE_slarfx2c(PLASMA_enum uplo, float V, float TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:177
void CORE_slaed3_computeW(int n, int K, const float *Q, int LDQ, const float *DLAMBDA, float *W, const int *INDX, int start, int end)
Definition: core_slaed3_computeW.c:66
int CORE_sswptr_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc, const float *Akk, int ldak)
Definition: core_slaswp.c:224
void CORE_sgbtype1cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype1cb.c:124
void CORE_strsm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strsm.c:80
int CORE_sttmlq(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmlq.c:116
int CORE_spltmg_chebvand(int M, int N, float *A, int LDA, int gN, int m0, int n0, float *W)
Definition: core_spltmg_chebvand.c:83
int CORE_spamm(int op, PLASMA_enum side, PLASMA_enum storev, int M, int N, int K, int L, const float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, float *W, int LDW)
Definition: core_spamm.c:175
void CORE_ssyrk(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, float beta, float *C, int LDC)
Definition: core_ssyrk.c:80
void CORE_ssbtype2cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype2cb.c:104
void CORE_sgeqp3_larfg(PLASMA_desc A, int ii, int jj, int i, int j, float *tau, float *beta)
Definition: core_sgeqp3_larfg.c:78
int CORE_shbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbrce.c:78
void CORE_sswap(int m, int n, float *Q, int ldq, const float *work, const int *perm, int start, int end)
Definition: core_sswap.c:67
void CORE_slaed2_copydef(int n, int n1, int K, const int *ctot, float *Q, int LDQ, const float *Q2, int start, int end)
Definition: core_slaed2_compressq.c:180
void CORE_slaed3_merge(int n, int K, float *D, int *INDXQ)
Definition: core_slaed3_merge.c:46
int CORE_spltmg(PLASMA_enum mtxtype, int m, int n, float *A, int lda, int gM, int gN, int m0, int n0, unsigned long long int seed)
Definition: core_spltmg.c:90
int CORE_slaswp_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:107
void CORE_slaset(PLASMA_enum uplo, int n1, int n2, float alpha, float beta, float *tileA, int ldtilea)
Definition: core_slaset.c:57
int CORE_ssyrfb(PLASMA_enum uplo, int N, int K, int IB, int NB, const float *A, int LDA, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_ssyrfb.c:110
int CORE_sgessm(int M, int N, int K, int IB, const int *IPIV, const float *L, int LDL, float *A, int LDA)
Definition: core_sgessm.c:70
int CORE_shblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shblrx.c:78
int CORE_slarfx2(PLASMA_enum side, int N, float V, float TAU, float *C1, int LDC1, float *C2, int LDC2)
Definition: core_slarfx_tbrd.c:82
void CORE_sgeqp3_pivot(PLASMA_desc A, float *F, int ldf, int jj, int k, int *jpvt, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_pivot.c:68
void CORE_sshiftw(int s, int cl, int m, int n, int L, float *A, float *W)
Definition: core_sshift.c:66
void CORE_strasm(PLASMA_enum storev, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int lda, float *work)
Definition: core_strasm.c:66
void CORE_spltmg_condexq(int M, int N, float *Q, int LDQ)
Definition: core_spltmg_condex.c:53
void CORE_sgeqp3_update(const float *Ajj, int lda1, float *Ajk, int lda2, const float *Fk, int ldf, int joff, int k, int koff, int nb, float *norms1, float *norms2, int *info)
Definition: core_sgeqp3_update.c:82
int CORE_slag2c(int m, int n, const float *R, int ldr, PLASMA_Complex32_t *Z, int ldz)
Definition: core_slag2c.c:58
void CORE_slaed2_compressq(int n, int n1, const int *INDX, const int *ctot, const float *Q, int LDQ, float *Q2, int start, int end)
Definition: core_slaed2_compressq.c:85
void CORE_sgeqp3_norms(PLASMA_desc A, int ioff, int joff, float *norms1, float *norms2)
Definition: core_sgeqp3_norms.c:62
void CORE_ssygst(int itype, PLASMA_enum uplo, int N, float *A, int LDA, float *B, int LDB, int *INFO)
Definition: core_ssygst.c:80
int CORE_sgetrf_reclap(CORE_sgetrf_data_t *data, int M, int N, float *A, int LDA, int *IPIV, int *info)
Definition: core_sgetrf_reclap.c:123
void CORE_strmm(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, int M, int N, float alpha, const float *A, int LDA, float *B, int LDB)
Definition: core_strmm.c:84
void CORE_slantr(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_enum diag, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slantr.c:86
int CORE_sgetrf_incpiv(int M, int N, int IB, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf_incpiv.c:83
int CORE_stsmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_stsmqr.c:124
int CORE_sgetrf_rectil(CORE_sgetrf_data_t *data, const PLASMA_desc A, int *IPIV, int *info)
Definition: core_sgetrf_rectil.c:120
void CORE_sbrdalg1(PLASMA_enum uplo, int n, int nb, float *A, int lda, float *VQ, float *TAUQ, float *VP, float *TAUP, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_sbrdalg1.c:111
int CORE_sparfb(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M1, int N1, int M2, int N2, int K, int L, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sparfb.c:132
void CORE_slaed3_updatevectors(int op, int wsmode, int n, int n1, int K, int il_nondef, int iu_nondef, float *Q, int ldq, float *Q2, const int *ctot, float *WORK, int start, int end)
Definition: core_slaed3_updatevectors.c:95
int CORE_stsmqr_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_corner.c:130
int CORE_stradd(PLASMA_enum uplo, PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, float beta, float *B, int LDB)
Definition: core_stradd.c:86
int CORE_sgbrce(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbrce.c:78
int CORE_stsmlq_corner(int m1, int n1, int m2, int n2, int m3, int n3, int k, int ib, int nb, float *A1, int lda1, float *A2, int lda2, float *A3, int lda3, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_corner.c:130
void CORE_ssbtype1cb(int N, int NB, float *A, int LDA, float *V, float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype1cb.c:100
int CORE_sttmqr(PLASMA_enum side, PLASMA_enum trans, int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *V, int LDV, const float *T, int LDT, float *WORK, int LDWORK)
Definition: core_sttmqr.c:116
int CORE_sgeqrt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgeqrt.c:86
void CORE_splrnt(int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splrnt.c:68
void CORE_slauum(PLASMA_enum uplo, int N, float *A, int LDA)
Definition: core_slauum.c:57
void CORE_ssbtype3cb(int N, int NB, float *A, int LDA, const float *V, const float *TAU, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_ssbtype3cb.c:101
void CORE_slange(int norm, int M, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slange.c:72
int CORE_slatro(PLASMA_enum uplo, PLASMA_enum trans, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slatro.c:80
Definition: plasma.h:34
void CORE_strdalg1(int n, int nb, float *A, int lda, float *V, float *TAU, int Vblksiz, int wantz, int i, int sweepid, int m, int grsiz, float *work)
Definition: core_strdalg1.c:91
Definition: core_sgetrf_reclap.c:24
int CORE_slarfx2ce(PLASMA_enum uplo, float *V, float *TAU, float *C1, float *C2, float *C3)
Definition: core_slarfx_tbrd.c:323
int CORE_sgbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgbelr.c:81
int CORE_stsmqr_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmqr_sytra1.c:127
int CORE_slacpy_pivot(const PLASMA_desc descA, PLASMA_enum direct, int k1, int k2, const int *ipiv, int *rankin, int *rankout, float *A, int lda, int init)
Definition: core_slacpy_pivot.c:84
int CORE_spltmg_hankel(PLASMA_enum uplo, int M, int N, float *A, int LDA, int m0, int n0, int nb, const float *V1, const float *V2)
Definition: core_spltmg_hankel.c:88
void CORE_sgemm(PLASMA_enum transA, PLASMA_enum transB, int M, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_sgemm.c:90
int CORE_sormqr(PLASMA_enum side, PLASMA_enum trans, int M, int N, int K, int IB, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormqr.c:108
void CORE_slaset2(PLASMA_enum uplo, int n1, int n2, float alpha, float *tileA, int ldtilea)
Definition: core_slaset2.c:55
int CORE_stslqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stslqt.c:107
void CORE_slarfy(int N, float *A, int LDA, const float *V, const float *TAU, float *WORK)
Definition: core_slarfy.c:61
int CORE_sgetrf_nopiv(int m, int n, int ib, float *A, int lda)
Definition: core_sgetrf_nopiv.c:69
void CORE_slaed3_reduceW(int n, int n1, int K, int l, const float *Q, int LDQ, const float *Wred, float *W)
Definition: core_slaed3_reduceW.c:60
void CORE_slaed2_computeK(int *K, int n, int n1, float *beta, float *D, float *Q, int LDQ, float *Z, float *DLAMBDA, float *W, int *INDX, int *INDXC, int *INDXP, int *INDXQ, int *COLTYP)
Definition: core_slaed2_computeK.c:104
void CORE_sgetrip(int m, int n, float *A, float *work)
Definition: core_sgetrip.c:51
int CORE_shbelr(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_shbelr.c:80
void CORE_spltmg_toeppd1(int gM, int m0, int M, float *W, unsigned long long int seed)
Definition: core_spltmg_toeppd.c:70
int CORE_sormlq(PLASMA_enum side, PLASMA_enum trans, int M, int N, int IB, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_sormlq.c:108
int CORE_slascl(PLASMA_enum type, int kl, int ku, float cfrom, float cto, int m, int n, float *A, int lda)
Definition: core_slascl.c:77
int CORE_sttlqt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sttlqt.c:116
void CORE_splgsy(float bump, int m, int n, float *A, int lda, int bigM, int m0, int n0, unsigned long long int seed)
Definition: core_splgsy.c:72
void CORE_sgemv(PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, const float *x, int incx, float beta, float *y, int incy)
Definition: core_sgemv.c:78
int CORE_slarfb_gemm(PLASMA_enum side, PLASMA_enum trans, PLASMA_enum direct, PLASMA_enum storev, int M, int N, int K, const float *V, int LDV, const float *T, int LDT, float *C, int LDC, float *WORK, int LDWORK)
Definition: core_slarfb_gemm.c:113
void CORE_ssetvar(const float *alpha, float *x)
Definition: core_ssetvar.c:37
int CORE_stsmlq_sytra1(PLASMA_enum side, PLASMA_enum trans, int m1, int n1, int m2, int n2, int k, int ib, float *A1, int lda1, float *A2, int lda2, const float *V, int ldv, const float *T, int ldt, float *WORK, int ldwork)
Definition: core_stsmlq_sytra1.c:125
int CORE_slaswpc_ontile(PLASMA_desc descA, int i1, int i2, const int *ipiv, int inc)
Definition: core_slaswp.c:296
int CORE_spemv(PLASMA_enum trans, PLASMA_enum storev, int M, int N, int L, float ALPHA, const float *A, int LDA, const float *X, int INCX, float BETA, float *Y, int INCY, float *WORK)
Definition: core_spemv.c:118
int CORE_sgelqt(int M, int N, int IB, float *A, int LDA, float *T, int LDT, float *TAU, float *WORK)
Definition: core_sgelqt.c:85
PLASMA_enum
Definition: plasma.h:24
void CORE_sgbtype2cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype2cb.c:129
int CORE_slaed4(int n, int K, float *D, float beta, float *Q, int LDQ, const float *D0, const float *Z, const int *INDX, int start, int end)
Definition: core_slaed4.c:75
int CORE_sstedc(PLASMA_enum compz, int n, float *D, float *E, float *Z, int LDZ, float *WORK, int LWORK, int *IWORK, int LIWORK)
Definition: core_sstedc.c:85
void CORE_slaswp(int N, float *A, int LDA, int I1, int I2, const int *IPIV, int INC)
Definition: core_slaswp.c:62
int CORE_stsqrt(int M, int N, int IB, float *A1, int LDA1, float *A2, int LDA2, float *T, int LDT, float *TAU, float *WORK)
Definition: core_stsqrt.c:97
void CORE_strtri(PLASMA_enum uplo, PLASMA_enum diag, int N, float *A, int LDA, int *info)
Definition: core_strtri.c:66
void CORE_ssymm(PLASMA_enum side, PLASMA_enum uplo, int M, int N, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssymm.c:88
void CORE_sasum(int storev, PLASMA_enum uplo, int M, int N, const float *A, int lda, float *work)
Definition: core_sasum.c:61
int CORE_sssssm(int M1, int N1, int M2, int N2, int K, int IB, float *A1, int LDA1, float *A2, int LDA2, const float *L1, int LDL1, const float *L2, int LDL2, const int *IPIV)
Definition: core_sssssm.c:94
void CORE_slaed3_computevectors(int K, int il_nondef, int iu_nondef, float *Q, int LDQ, float *W, float *S, const int *INDXC, int start, int end)
Definition: core_slaed3_computevectors.c:74
void CORE_slacpy(PLASMA_enum uplo, int M, int N, const float *A, int LDA, float *B, int LDB)
Definition: core_slacpy.c:59
PLASMA_desc
Definition: descriptor.h:41
void CORE_spltmg_fiedler(int m, int n, const float *X, int incX, const float *Y, int incY, float *A, int lda)
Definition: core_spltmg_fiedler.c:75
void CORE_slansy(int norm, PLASMA_enum uplo, int N, const float *A, int LDA, float *work, float *normA)
Definition: core_slansy.c:74
void CORE_spltmg_toeppd2(int M, int N, int K, int m0, int n0, const float *W, float *A, int LDA)
Definition: core_spltmg_toeppd.c:149
int CORE_spltmg_circul(int M, int N, float *A, int LDA, int gM, int m0, int n0, const float *V)
Definition: core_spltmg_circul.c:76
int CORE_sgblrx(PLASMA_enum uplo, int N, PLASMA_desc *A, float *V, float *TAU, int st, int ed, int eltsize)
Definition: core_sgblrx.c:80
void CORE_sswpab(int i, int n1, int n2, float *A, float *work)
Definition: core_sswpab.c:63
int CORE_slascal(PLASMA_enum uplo, int m, int n, float alpha, float *A, int lda)
Definition: core_slascal.c:52
int CORE_sgeadd(PLASMA_enum trans, int M, int N, float alpha, const float *A, int LDA, float beta, float *B, int LDB)
Definition: core_sgeadd.c:75
int CORE_ststrf(int M, int N, int IB, int NB, float *U, int LDU, float *A, int LDA, float *L, int LDL, int *IPIV, float *WORK, int LDWORK, int *INFO)
Definition: core_ststrf.c:99
void CORE_sgeqp3_init(int n, int *jpvt)
Definition: core_sgeqp3_init.c:38
int CORE_ssteqr(PLASMA_enum compz, int n, float *D, float *E, float *Z, int LDZ, float *WORK)
Definition: core_ssteqr.c:66
void CORE_ssyr2k(PLASMA_enum uplo, PLASMA_enum trans, int N, int K, float alpha, const float *A, int LDA, const float *B, int LDB, float beta, float *C, int LDC)
Definition: core_ssyr2k.c:90
void CORE_sgbtype3cb(PLASMA_enum uplo, int N, int NB, float *A, int LDA, float *VQ, float *TAUQ, float *VP, float *TAUP, int st, int ed, int sweep, int Vblksiz, int WANTZ, float *WORK)
Definition: core_sgbtype3cb.c:124
int CORE_sgetrf(int M, int N, float *A, int LDA, int *IPIV, int *INFO)
Definition: core_sgetrf.c:60