|
PLASMA 2.3.1
|
00001 00017 /***************************************************************************/ 00020 #define plasma_ddesc_alloc( descA, mb, nb, lm, ln, i, j, m, n, free) \ 00021 descA = plasma_desc_init( \ 00022 PlasmaRealDouble, (mb), (nb), ((mb)*(nb)), \ 00023 (m), (n), (i), (j), (m), (n)); \ 00024 if ( plasma_desc_mat_alloc( &(descA) ) ) { \ 00025 plasma_error( __func__, "plasma_shared_alloc() failed"); \ 00026 {free;}; \ 00027 return PLASMA_ERR_OUT_OF_RESOURCES; \ 00028 } 00029 00030 #define plasma_dooplap2tile( descA, A, mb, nb, lm, ln, i, j, m, n, free) \ 00031 descA = plasma_desc_init( \ 00032 PlasmaRealDouble, (mb), (nb), ((mb)*(nb)), \ 00033 (lm), (ln), (i), (j), (m), (n)); \ 00034 if ( plasma_desc_mat_alloc( &(descA) ) ) { \ 00035 plasma_error( __func__, "plasma_shared_alloc() failed"); \ 00036 {free;}; \ 00037 return PLASMA_ERR_OUT_OF_RESOURCES; \ 00038 } \ 00039 plasma_parallel_call_5( \ 00040 plasma_pdlapack_to_tile, \ 00041 double*, (A), \ 00042 int, (lm), \ 00043 PLASMA_desc, (descA), \ 00044 PLASMA_sequence*, sequence, \ 00045 PLASMA_request*, &request); 00046 00047 #define plasma_diplap2tile( descA, A, mb, nb, lm, ln, i, j, m, n) \ 00048 descA = plasma_desc_init( \ 00049 PlasmaRealDouble, (mb), (nb), ((mb)*(nb)), \ 00050 (lm), (ln), (i), (j), (m), (n)); \ 00051 descA.mat = A; \ 00052 PLASMA_dgecfi_Async((lm), (ln), (A), PlasmaCM, (mb), (nb), \ 00053 PlasmaCCRB, (mb), (nb), sequence, &request); 00054 00055 00056 00057 #define plasma_dooptile2lap( descA, A, mb, nb, lm, ln) \ 00058 plasma_parallel_call_5(plasma_pdtile_to_lapack, \ 00059 PLASMA_desc, (descA), \ 00060 double*, (A), \ 00061 int, (lm), \ 00062 PLASMA_sequence*, sequence, \ 00063 PLASMA_request*, &request); 00064 00065 #define plasma_diptile2lap( descA, A, mb, nb, lm, ln) \ 00066 PLASMA_dgecfi_Async((lm), (ln), (A), PlasmaCCRB, (mb), (nb), \ 00067 PlasmaCM, (mb), (nb), sequence, &request); 00068 00069 /***************************************************************************/ 00072 void plasma_pdaxpy (plasma_context_t *plasma); 00073 void plasma_pdgelqf (plasma_context_t *plasma); 00074 void plasma_pdgemm (plasma_context_t *plasma); 00075 void plasma_pdgeqrf (plasma_context_t *plasma); 00076 void plasma_pdgerbb (plasma_context_t *plasma); 00077 void plasma_pdgetmi2(plasma_context_t *plasma); 00078 void plasma_pdgetrf_incpiv(plasma_context_t *plasma); 00079 #ifdef COMPLEX 00080 void plasma_pdsymm (plasma_context_t *plasma); 00081 void plasma_pdsyrk (plasma_context_t *plasma); 00082 void plasma_pdsyr2k (plasma_context_t *plasma); 00083 #endif 00084 void plasma_pdlacpy (plasma_context_t *plasma); 00085 void plasma_pdlag2s (plasma_context_t *plasma); 00086 void plasma_pdlange (plasma_context_t *plasma); 00087 #ifdef COMPLEX 00088 void plasma_pdlansy (plasma_context_t *plasma); 00089 #endif 00090 void plasma_pdlansy (plasma_context_t *plasma); 00091 void plasma_pdpack (plasma_context_t *plasma); 00092 void plasma_pdplgsy (plasma_context_t *plasma); 00093 void plasma_pdplgsy (plasma_context_t *plasma); 00094 void plasma_pdplrnt (plasma_context_t *plasma); 00095 void plasma_pdpotrf (plasma_context_t *plasma); 00096 void plasma_pdshift (plasma_context_t *plasma); 00097 void plasma_pdsymm (plasma_context_t *plasma); 00098 void plasma_pdsyrk (plasma_context_t *plasma); 00099 void plasma_pdsyr2k (plasma_context_t *plasma); 00100 void plasma_pdtrmm (plasma_context_t *plasma); 00101 void plasma_pdtrsm (plasma_context_t *plasma); 00102 void plasma_pdtrsmpl(plasma_context_t *plasma); 00103 void plasma_pdorglq (plasma_context_t *plasma); 00104 void plasma_pdorgqr (plasma_context_t *plasma); 00105 void plasma_pdorgqrrh(plasma_context_t *plasma); 00106 void plasma_pdormlq (plasma_context_t *plasma); 00107 void plasma_pdormqr (plasma_context_t *plasma); 00108 void plasma_pdunpack(plasma_context_t *plasma); 00109 00110 /***************************************************************************/ 00113 int plasma_dshift(plasma_context_t *plasma, int m, int n, double *A, 00114 int nprob, int me, int ne, int L, 00115 PLASMA_sequence *sequence, PLASMA_request *request); 00116 00117 /***************************************************************************/ 00120 void plasma_pdaxpy_quark(double alpha, PLASMA_desc A, PLASMA_desc B, PLASMA_sequence *sequence, PLASMA_request *request); 00121 void plasma_pdbarrier_tl2pnl_quark(PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00122 void plasma_pdbarrier_pnl2tl_quark(PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00123 void plasma_pdgelqf_quark(PLASMA_desc A, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00124 void plasma_pdgelqfrh_quark(PLASMA_desc A, PLASMA_desc T, int BS, PLASMA_sequence *sequence, PLASMA_request *request); 00125 void plasma_pdgemm_quark(PLASMA_enum transA, PLASMA_enum transB, double alpha, PLASMA_desc A, PLASMA_desc B, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00126 void plasma_pdgeqrf_quark(PLASMA_desc A, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00127 void plasma_pdgeqrfrh_quark(PLASMA_desc A, PLASMA_desc T, int BS, PLASMA_sequence *sequence, PLASMA_request *request); 00128 void plasma_pdgerbh_quark(PLASMA_desc A, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00129 void plasma_pdgerbb_quark(PLASMA_desc A, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00130 void plasma_pdgerbbrh_quark(PLASMA_desc A, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00131 void plasma_pdgetmi2_quark(PLASMA_enum idep, PLASMA_enum odep, PLASMA_enum storev, int m, int n, int mb, int nb, double *A, PLASMA_sequence *sequence, PLASMA_request *request); 00132 void plasma_pdgetrf_incpiv_quark(PLASMA_desc A, PLASMA_desc L, int *IPIV, PLASMA_sequence *sequence, PLASMA_request *request); 00133 void plasma_pdgetrf_reclap_quark(PLASMA_desc A, int *IPIV, PLASMA_sequence *sequence, PLASMA_request *request); 00134 void plasma_pdgetrf_rectil_quark(PLASMA_desc A, int *IPIV, PLASMA_sequence *sequence, PLASMA_request *request); 00135 #ifdef COMPLEX 00136 void plasma_pdsygst_quark(PLASMA_enum itype, PLASMA_enum uplo, PLASMA_desc A, PLASMA_desc B, PLASMA_sequence *sequence, PLASMA_request *request); 00137 void plasma_pdsymm_quark(PLASMA_enum side, PLASMA_enum uplo, double alpha, PLASMA_desc A, PLASMA_desc B, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00138 void plasma_pdsyrk_quark(PLASMA_enum uplo, PLASMA_enum trans, double alpha, PLASMA_desc A, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00139 void plasma_pdsyr2k_quark(PLASMA_enum uplo, PLASMA_enum trans, double alpha, PLASMA_desc A, PLASMA_desc B, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00140 void plasma_pdsyrbt_quark(PLASMA_enum uplo, PLASMA_desc A, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00141 void plasma_pdgbrdb_quark(PLASMA_enum uplo, PLASMA_desc A, double *D, double *E, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00142 void plasma_pdsbrdt_quark(PLASMA_enum uplo, PLASMA_desc A, double *D, double *E, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00143 #endif 00144 void plasma_pdlacpy_quark(PLASMA_enum uplo, PLASMA_desc A, PLASMA_desc B, PLASMA_sequence *sequence, PLASMA_request *request); 00145 void plasma_pdlag2s_quark(PLASMA_desc A, PLASMA_desc SB, PLASMA_sequence *sequence, PLASMA_request *request); 00146 void plasma_pdlange_quark(PLASMA_enum norm, PLASMA_desc A, double *work, double *result, PLASMA_sequence *sequence, PLASMA_request *request); 00147 #ifdef COMPLEX 00148 void plasma_pdlansy_quark(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_desc A, double *work, double *result, PLASMA_sequence *sequence, PLASMA_request *request); 00149 #endif 00150 void plasma_pdlansy_quark(PLASMA_enum norm, PLASMA_enum uplo, PLASMA_desc A, double *work, double *result, PLASMA_sequence *sequence, PLASMA_request *request); 00151 void plasma_pdlaset_quark( PLASMA_enum uplo, double alpha, double beta, PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00152 void plasma_pdlaset2_quark(PLASMA_enum uplo, double alpha, PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00153 void plasma_pdlaswp_quark(PLASMA_desc B, int *IPIV, int inc, PLASMA_sequence *sequence, PLASMA_request *request); 00154 void plasma_pdlauum_quark(PLASMA_enum uplo, PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00155 void plasma_pdplgsy_quark(double bump, PLASMA_desc A, unsigned long long int seed, PLASMA_sequence *sequence, PLASMA_request *request); 00156 void plasma_pdplgsy_quark(double bump, PLASMA_desc A, unsigned long long int seed, PLASMA_sequence *sequence, PLASMA_request *request ); 00157 void plasma_pdplrnt_quark(PLASMA_desc A, unsigned long long int seed, PLASMA_sequence *sequence, PLASMA_request *request ); 00158 void plasma_pdpotrf_quark(PLASMA_enum uplo, PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00159 void plasma_pdshift_quark(int, int, int, double *, int *, int, int, PLASMA_sequence*, PLASMA_request*); 00160 void plasma_pdsymm_quark(PLASMA_enum side, PLASMA_enum uplo, double alpha, PLASMA_desc A, PLASMA_desc B, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00161 void plasma_pdsyrk_quark(PLASMA_enum uplo, PLASMA_enum trans, double alpha, PLASMA_desc A, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00162 void plasma_pdsyr2k_quark(PLASMA_enum uplo, PLASMA_enum trans, double alpha, PLASMA_desc A, PLASMA_desc B, double beta, PLASMA_desc C, PLASMA_sequence *sequence, PLASMA_request *request); 00163 void plasma_pdtrmm_quark(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, double alpha, PLASMA_desc A, PLASMA_desc B, PLASMA_sequence *sequence, PLASMA_request *request); 00164 void plasma_pdtrsm_quark(PLASMA_enum side, PLASMA_enum uplo, PLASMA_enum transA, PLASMA_enum diag, double alpha, PLASMA_desc A, PLASMA_desc B, PLASMA_sequence *sequence, PLASMA_request *request); 00165 void plasma_pdtrsmpl_quark(PLASMA_desc A, PLASMA_desc B, PLASMA_desc L, int *IPIV, PLASMA_sequence *sequence, PLASMA_request *request); 00166 void plasma_pdtrtri_quark(PLASMA_enum uplo, PLASMA_enum diag, PLASMA_desc A, PLASMA_sequence *sequence, PLASMA_request *request); 00167 void plasma_pdorgbr_quark(PLASMA_enum side, PLASMA_desc A, PLASMA_desc O, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00168 void plasma_pdorgbrrh_quark(PLASMA_enum side, PLASMA_desc A, PLASMA_desc O, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00169 void plasma_pdorgqr_quark(PLASMA_desc A, PLASMA_desc Q, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00170 void plasma_pdorgqrrh_quark(PLASMA_desc A, PLASMA_desc Q, PLASMA_desc T, int BS, PLASMA_sequence *sequence, PLASMA_request *request); 00171 void plasma_pdorglq_quark(PLASMA_desc A, PLASMA_desc Q, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00172 void plasma_pdorglqrh_quark(PLASMA_desc A, PLASMA_desc Q, PLASMA_desc T, int BS, PLASMA_sequence *sequence, PLASMA_request *request); 00173 void plasma_pdorgtr_quark(PLASMA_enum uplo, PLASMA_desc A, PLASMA_desc Q, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00174 void plasma_pdormqr_quark(PLASMA_enum side, PLASMA_enum trans, PLASMA_desc A, PLASMA_desc B, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00175 void plasma_pdormqrrh_quark(PLASMA_enum side, PLASMA_enum trans, PLASMA_desc A, PLASMA_desc B, PLASMA_desc T, int BS, PLASMA_sequence *sequence, PLASMA_request *request); 00176 void plasma_pdormlq_quark(PLASMA_enum side, PLASMA_enum trans, PLASMA_desc A, PLASMA_desc B, PLASMA_desc T, PLASMA_sequence *sequence, PLASMA_request *request); 00177 void plasma_pdormlqrh_quark(PLASMA_enum side, PLASMA_enum trans, PLASMA_desc A, PLASMA_desc B, PLASMA_desc T, int BS, PLASMA_sequence *sequence, PLASMA_request *request);
1.7.3