Code: Select all
compile errors on device 0:
----
compile errors on device 0:
----
compile errors on device 0:
----
compile errors on device 0:
...
Code: Select all
compile errors on device 0:
----
compile errors on device 0:
----
compile errors on device 0:
----
compile errors on device 0:
...
Code: Select all
magma_init()
Code: Select all
clmagma-1.3.0/testing> echo $clBLAS
/usr/local/clBLAS-2.4
clmagma-1.3.0/testing> setenv LD_LIBRARY_PATH ${LD_LIBRARY_PATH}:${HOME}/src/clmagma-1.3.0/lib
clmagma-1.3.0/testing> ./testing_dpotrf --range 100:1000:100 -c
% clMAGMA 1.3.0
% OpenCL platform OpenCL 1.2 (Nov 2 2015 15:02:14). MAGMA not compiled with OpenMP.
% Device: GeForce GT 750M, 2048.0 MiB memory, max allocation 512.0 MiB, driver 8.26.29 310.40.55f01
Usage: ./testing_dpotrf [options] [-h|--help]
ngpu = 1, uplo = Lower
N CPU GFlop/s (sec) GPU GFlop/s (sec) ||R_magma - R_lapack||_F / ||R_lapack||_F
========================================================
100 6.51 ( 0.00) 3.59 ( 0.00) 0.00e+00 ok
200 5.69 ( 0.00) 0.16 ( 0.02) 4.54e-17 ok
300 11.32 ( 0.00) 0.54 ( 0.02) 8.64e-17 ok
400 19.67 ( 0.00) 0.80 ( 0.03) 6.89e-17 ok
500 23.42 ( 0.00) 1.29 ( 0.03) 6.71e-17 ok
600 38.62 ( 0.00) 1.76 ( 0.04) 7.85e-17 ok
700 38.04 ( 0.00) 1.86 ( 0.06) 7.52e-17 ok
800 37.69 ( 0.00) 1.93 ( 0.09) 6.77e-17 ok
900 53.26 ( 0.00) 2.29 ( 0.11) 6.33e-17 ok
1000 55.19 ( 0.01) 2.75 ( 0.12) 5.97e-17 ok
Code: Select all
./testing_dpotrf --range 100:1000:100 -c
compile errors on device 0:
----
compile errors on device 0:
... repeated many times
----
% clMAGMA 1.3.0 svn
% OpenCL platform OpenCL 1.2 CUDA 7.5.26. OpenMP threads 4.
% Device: GeForce GTX 970, 4095.3 MiB memory, max allocation 1023.8 MiB, driver 352.93
% Usage: ./testing_dpotrf [options] [-h|--help]
% ngpu = 1, uplo = Lower
% N CPU GFlop/s (sec) GPU GFlop/s (sec) ||R_magma - R_lapack||_F / ||R_lapack||_F
%=======================================================
100 1.84 ( 0.00) 0.01 ( 0.04) 0.00e+00 ok
dtrsm( R, L, C, N, 72, 128, 224, 224 )
dtrsm done
200 6.09 ( 0.00) 0.02 ( 0.13) 8.30e-18 ok
dtrsm( R, L, C, N, 172, 128, 320, 320 )
dtrsm done
dtrsm( R, L, C, N, 44, 128, 320, 320 )
dtrsm done
300 12.39 ( 0.00) 0.03 ( 0.29) 3.64e-17 ok
dtrsm( R, L, C, N, 272, 128, 416, 416 )
dtrsm done
dtrsm( R, L, C, N, 144, 128, 416, 416 )
dtrsm done
dtrsm( R, L, C, N, 16, 128, 416, 416 )
dtrsm done
400 18.10 ( 0.00) 3.34 ( 0.01) 3.59e-17 ok
dtrsm( R, L, C, N, 372, 128, 512, 512 )
dtrsm done
dtrsm( R, L, C, N, 244, 128, 512, 512 )
dtrsm done
dtrsm( R, L, C, N, 116, 128, 512, 512 )
dtrsm done
500 25.04 ( 0.00) 5.60 ( 0.01) 3.16e-17 ok
dtrsm( R, L, C, N, 472, 128, 608, 608 )
dtrsm done
dtrsm( R, L, C, N, 344, 128, 608, 608 )
dtrsm done
dtrsm( R, L, C, N, 216, 128, 608, 608 )
dtrsm done
dtrsm( R, L, C, N, 88, 128, 608, 608 )
dtrsm done
600 30.72 ( 0.00) 12.49 ( 0.01) 4.25e-17 ok
dtrsm( R, L, C, N, 572, 128, 704, 704 )
dtrsm done
dtrsm( R, L, C, N, 444, 128, 704, 704 )
dtrsm done
dtrsm( R, L, C, N, 316, 128, 704, 704 )
dtrsm done
dtrsm( R, L, C, N, 188, 128, 704, 704 )
dtrsm done
dtrsm( R, L, C, N, 60, 128, 704, 704 )
dtrsm done
700 17.74 ( 0.01) 14.63 ( 0.01) 4.04e-17 ok
dtrsm( R, L, C, N, 672, 128, 800, 800 )
dtrsm done
dtrsm( R, L, C, N, 544, 128, 800, 800 )
dtrsm done
dtrsm( R, L, C, N, 416, 128, 800, 800 )
dtrsm done
dtrsm( R, L, C, N, 288, 128, 800, 800 )
dtrsm done
dtrsm( R, L, C, N, 160, 128, 800, 800 )
dtrsm done
dtrsm( R, L, C, N, 32, 128, 800, 800 )
dtrsm done
800 23.85 ( 0.01) 1.52 ( 0.11) 4.37e-17 ok
dtrsm( R, L, C, N, 772, 128, 928, 928 )
dtrsm done
dtrsm( R, L, C, N, 644, 128, 928, 928 )
dtrsm done
dtrsm( R, L, C, N, 516, 128, 928, 928 )
dtrsm done
dtrsm( R, L, C, N, 388, 128, 928, 928 )
dtrsm done
dtrsm( R, L, C, N, 260, 128, 928, 928 )
dtrsm done
dtrsm( R, L, C, N, 132, 128, 928, 928 )
dtrsm done
dtrsm( R, L, C, N, 4, 128, 928, 928 )
dtrsm done
900 43.13 ( 0.01) 15.08 ( 0.02) 3.97e-17 ok
dtrsm( R, L, C, N, 872, 128, 1024, 1024 )
dtrsm done
dtrsm( R, L, C, N, 744, 128, 1024, 1024 )
dtrsm done
dtrsm( R, L, C, N, 616, 128, 1024, 1024 )
dtrsm done
dtrsm( R, L, C, N, 488, 128, 1024, 1024 )
dtrsm done
dtrsm( R, L, C, N, 360, 128, 1024, 1024 )
dtrsm done
dtrsm( R, L, C, N, 232, 128, 1024, 1024 )
dtrsm done
dtrsm( R, L, C, N, 104, 128, 1024, 1024 )
dtrsm done
1000 42.20 ( 0.01) 18.55 ( 0.02) 3.77e-17 ok
Code: Select all
mint clmagma-1.3.0/testing> ./testing_dpotrf --range 100:1000:100 -c
Error: file 'clmagma_kernels.co' not found in $LD_LIBRARY_PATH '/Users/mgates/src/hadoop-2.6.0/lib:/Users/mgates/Documents/cl-magma/lib:/usr/local/openblas/lib:/usr/local/cuda-7.5/lib:/usr/local/cuda-7.5/extras/CUPTI/lib:/usr/local/openmpi/lib'
% clMAGMA 1.3.0
% OpenCL platform OpenCL 1.2 (Nov 2 2015 15:02:14). MAGMA not compiled with OpenMP.
% Device: GeForce GT 750M, 2048.0 MiB memory, max allocation 512.0 MiB, driver 8.26.29 310.40.55f01
Usage: ./testing_dpotrf [options] [-h|--help]
ngpu = 1, uplo = Lower
N CPU GFlop/s (sec) GPU GFlop/s (sec) ||R_magma - R_lapack||_F / ||R_lapack||_F
========================================================
100 6.66 ( 0.00) 3.49 ( 0.00) 0.00e+00 ok
OpenCL runtime error: unknown OpenCL error code (-1017) in magma_dsyrk at blas_d.cpp:1268
200 6.48 ( 0.00) 0.26 ( 0.01) 4.54e-17 ok
OpenCL runtime error: unknown OpenCL error code (-1017) in magma_dsyrk at blas_d.cpp:1268
300 15.81 ( 0.00) 0.86 ( 0.01) 8.64e-17 ok
OpenCL runtime error: unknown OpenCL error code (-1017) in magma_dsyrk at blas_d.cpp:1268
400 22.90 ( 0.00) 1.14 ( 0.02) 6.89e-17 ok
Code: Select all
mint clmagma-1.3.0/testing> ./testing_dpotrf --range 100:400:100 -c
Error: file 'clmagma_kernels.co' not found in $LD_LIBRARY_PATH '.'
% clMAGMA 1.3.0
% OpenCL platform OpenCL 1.2 (Nov 2 2015 15:02:14). MAGMA not compiled with OpenMP.
% Device: GeForce GT 750M, 2048.0 MiB memory, max allocation 512.0 MiB, driver 8.26.29 310.40.55f01
Usage: ./testing_dpotrf [options] [-h|--help]
ngpu = 1, uplo = Lower
N CPU GFlop/s (sec) GPU GFlop/s (sec) ||R_magma - R_lapack||_F / ||R_lapack||_F
========================================================
100 5.57 ( 0.00) 2.96 ( 0.00) 0.00e+00 ok
200 6.37 ( 0.00) 0.19 ( 0.01) 4.54e-17 ok
300 12.44 ( 0.00) 0.55 ( 0.02) 8.64e-17 ok
400 19.29 ( 0.00) 0.69 ( 0.03) 6.89e-17 ok
mint clmagma-1.3.0/testing> setenv LD_LIBRARY_PATH ../lib
mint clmagma-1.3.0/testing> ./testing_dpotrf --range 100:400:100 -c
% clMAGMA 1.3.0
% OpenCL platform OpenCL 1.2 (Nov 2 2015 15:02:14). MAGMA not compiled with OpenMP.
% Device: GeForce GT 750M, 2048.0 MiB memory, max allocation 512.0 MiB, driver 8.26.29 310.40.55f01
Usage: ./testing_dpotrf [options] [-h|--help]
ngpu = 1, uplo = Lower
N CPU GFlop/s (sec) GPU GFlop/s (sec) ||R_magma - R_lapack||_F / ||R_lapack||_F
========================================================
100 3.64 ( 0.00) 1.93 ( 0.00) 0.00e+00 ok
200 4.52 ( 0.00) 0.17 ( 0.02) 4.54e-17 ok
300 11.61 ( 0.00) 0.56 ( 0.02) 8.64e-17 ok
400 19.20 ( 0.00) 0.70 ( 0.03) 6.89e-17 ok