/* Larger of two values; yields (b) when the operands compare equal.
 * Function-like macro: each argument may be evaluated twice, so do not
 * pass expressions with side effects (e.g. max(i++, j)). */
#define max(a, b) (((b) < (a)) ? (a) : (b))
/* Smaller of two values; yields (b) when the operands compare equal.
 * Function-like macro: each argument may be evaluated twice, so do not
 * pass expressions with side effects (e.g. min(i++, j)). */
#define min(a, b) (((b) > (a)) ? (a) : (b))
/* Forward declaration of the solution checker defined later in this file.
 * Parameter names mirror that definition. */
int check_solution(int M, int N, int NRHS,
                   double *A1, int LDA,
                   double *B1, double *B2, int LDB);
53 int LDBxNRHS = LDB*NRHS;
55 double *A1 = (
double *)malloc(LDA*N*
sizeof(
double));
56 double *A2 = (
double *)malloc(LDA*N*
sizeof(
double));
57 double *B1 = (
double *)malloc(LDB*NRHS*
sizeof(
double));
58 double *B2 = (
double *)malloc(LDB*NRHS*
sizeof(
double));
62 if ((!A1)||(!A2)||(!B1)||(!B2)){
63 printf(
"Out of Memory \n ");
69 printf(
"-- PLASMA is initialized to run on %d cores. \n",cores);
75 LAPACKE_dlarnv_work(
IONE,
ISEED, LDAxN, A1);
76 for (i = 0; i < M; i++)
77 for (j = 0; j < N; j++)
78 A2[LDA*j+i] = A1[LDA*j+i] ;
81 LAPACKE_dlarnv_work(
IONE,
ISEED, LDBxNRHS, B1);
82 for (i = 0; i < M; i++)
83 for (j = 0; j < NRHS; j++)
84 B2[LDB*j+i] = B1[LDB*j+i] ;
92 if ((info_solution != 0)|(info != 0))
93 printf(
"-- Error in DGELS example ! \n");
95 printf(
"-- Run of DGELS example successful ! \n");
97 free(A1); free(A2); free(B1); free(B2); free(T);
/*
 * check_solution - print a scaled residual for a computed solution and
 * return a status flag (info_solution).
 *
 * Parameters as used by the visible calls:
 *   M, N, NRHS - integer dimensions passed to the dgemm calls and used to
 *                size the scratch buffers.
 *   A1, LDA    - column-major matrix operand and its leading dimension.
 *   B1, LDB    - column-major matrix; it is the OUTPUT operand of the first
 *                dgemm below, so its contents are overwritten here.
 *   B2         - column-major matrix used as the right-hand operand of the
 *                first dgemm (shares leading dimension LDB).
 *
 * NOTE(review): this view of the function has gaps -- the declarations of
 * eps, alpha, beta and info_solution, the computation of the norms, and the
 * surrounding braces/branches are not visible. Comments below describe only
 * what the visible statements do.
 */
108 int check_solution(
int M,
int N,
int NRHS,
double *A1,
int LDA,
double *B1,
double *B2,
int LDB)
/* Norm values used in the printed ratio; where they are assigned is not
 * visible in this view. */
111 double Rnorm, Anorm, Xnorm, Bnorm;
/* Scratch buffer of max(M, N) doubles. NOTE(review): no NULL check on this
 * allocation is visible here -- confirm against the full file. */
113 double *work = (
double *)malloc(
max(M, N)*
sizeof(double));
/* Query LAPACK's dlamch with 'e' (relative machine epsilon per the LAPACK
 * documentation); used to scale the residual below. */
116 eps = LAPACKE_dlamch_work(
'e');
/* B1 := alpha * A1 * B2 + beta * B1, with an M x NRHS result. The values
 * of alpha and beta are set outside the visible lines. */
125 cblas_dgemm(
CblasColMajor,
CblasNoTrans,
CblasNoTrans, M, NRHS, N, (alpha), A1, LDA, B2, LDB, (beta), B1, LDB);
/* First Residual buffer: M*NRHS doubles, zero-filled, then
 * Residual := alpha * A1^T * B1 + beta * Residual with leading dimension M.
 * NOTE(review): Residual is declared twice in this view; presumably the two
 * declarations sit in separate branches that are not visible -- confirm. */
128 double *Residual = (
double *)malloc(M*NRHS*
sizeof(
double));
129 memset((
void*)Residual, 0, M*NRHS*
sizeof(
double));
130 cblas_dgemm(
CblasColMajor,
CblasTrans,
CblasNoTrans, N, NRHS, M, (alpha), A1, LDA, B1, LDB, (beta), Residual, M);
/* Second Residual buffer: same product as above, but sized N*NRHS doubles
 * and stored with leading dimension N. */
135 double *Residual = (
double *)malloc(N*NRHS*
sizeof(
double));
136 memset((
void*)Residual, 0, N*NRHS*
sizeof(
double));
137 cblas_dgemm(
CblasColMajor,
CblasTrans,
CblasNoTrans, N, NRHS, M, (alpha), A1, LDA, B1, LDB, (beta), Residual, N);
/* Report the scaled residual Rnorm / ((Anorm*Xnorm + Bnorm) * N * eps). */
142 printf(
"============\n");
143 printf(
"Checking the Residual of the solution \n");
144 printf(
"-- ||Ax-B||_oo/((||A||_oo||x||_oo+||B||)_oo.N.eps) = %e \n",Rnorm/((Anorm*Xnorm+Bnorm)*N*eps));
/* Flag the solution when the scaled residual is NaN or exceeds 10.0. */
146 if (isnan(Rnorm / ((Anorm * Xnorm + Bnorm) * N * eps)) || (Rnorm / ((Anorm * Xnorm + Bnorm) * N * eps) > 10.0) ) {
147 printf(
"-- The solution is suspicious ! \n");
/* Presumably the else-branch of the test above (the else itself is not
 * visible in this view). */
151 printf(
"-- The solution is CORRECT ! \n");
/* Status flag for the caller; where it is assigned is not visible here. */
157 return info_solution;