*  Source listing: plasma/docs/dchkge_8f_source.html

      SUBROUTINE dchkge( dotype, nm, mval, nn, nval, nnb, nbval, nns,
     $                   ibval, nsval, thresh, tsterr, nmax, a, afac,
     $                   ainv, b, x, xact, work, rwork, iwork, nout )
*
      include 'plasmaf.h'
*
*  -- LAPACK test routine (version 3.1.1) --
*     Univ. of Tennessee, Univ. of California Berkeley and NAG Ltd..
*     January 2007
*
*     .. Scalar Arguments ..
      LOGICAL            tsterr
      INTEGER            nm, nmax, nn, nnb, nns, nout
      DOUBLE PRECISION   thresh
*     ..
*     .. Array Arguments ..
      LOGICAL            dotype( * )
      INTEGER            ibval( * ), iwork( * ), mval( * ), nbval( * ),
     $                   nsval( * ), nval( * )
      DOUBLE PRECISION   a( * ), afac( * ), ainv( * ), b( * ),
     $                   rwork( * ), work( * ), x( * ), xact( * )
*     ..
*
*  Purpose
*  =======
*
*  DCHKGE tests the PLASMA routines PLASMA_DGETRF and PLASMA_DGETRS.
*
*  For every M in MVAL, N in NVAL, enabled matrix type and (NB, IB)
*  pair, a test matrix is generated and factored with PLASMA_DGETRF,
*  and the returned INFO is compared with the expected value.  When
*  the matrix is square and INFO <= 0, the system A*X = B is solved
*  with PLASMA_DGETRS for every NRHS in NSVAL and two test ratios
*  are computed:
*
*     test 3:  residual of the computed solution     (DGET02)
*     test 4:  comparison with the generated solution (DGET04)
*
*  Only the no-transpose case is exercised (NTRAN = 1).
*
*  Arguments
*  =========
*
*  DOTYPE  (input) LOGICAL array, dimension (NTYPES)
*          The matrix types to be used for testing.  Matrices of type j
*          (for 1 <= j <= NTYPES) are used for testing if DOTYPE(j) =
*          .TRUE.; if DOTYPE(j) = .FALSE., then type j is not used.
*
*  NM      (input) INTEGER
*          The number of values of M contained in the vector MVAL.
*
*  MVAL    (input) INTEGER array, dimension (NM)
*          The values of the matrix row dimension M.
*
*  NN      (input) INTEGER
*          The number of values of N contained in the vector NVAL.
*
*  NVAL    (input) INTEGER array, dimension (NN)
*          The values of the matrix column dimension N.
*
*  NNB     (input) INTEGER
*          The number of values of NB contained in the vector NBVAL
*          (and of IB contained in the vector IBVAL).
*
*  NBVAL   (input) INTEGER array, dimension (NNB)
*          The values of the tile size NB.
*
*  IBVAL   (input) INTEGER array, dimension (NNB)
*          The values of the inner block size IB.  IBVAL(j) is used
*          together with NBVAL(j).
*
*  NNS     (input) INTEGER
*          The number of values of NRHS contained in the vector NSVAL.
*
*  NSVAL   (input) INTEGER array, dimension (NNS)
*          The values of the number of right hand sides NRHS.
*
*  THRESH  (input) DOUBLE PRECISION
*          The threshold value for the test ratios.  A result is
*          included in the output file if RESULT >= THRESH.  To have
*          every test ratio printed, use THRESH = 0.
*
*  TSTERR  (input) LOGICAL
*          Flag that indicates whether error exits are to be tested.
*
*  NMAX    (input) INTEGER
*          The maximum value permitted for M or N, used in dimensioning
*          the work arrays.  Not referenced inside this routine.
*
*  A       (workspace) DOUBLE PRECISION array, dimension (NMAX*NMAX)
*
*  AFAC    (workspace) DOUBLE PRECISION array, dimension (NMAX*NMAX)
*
*  AINV    (workspace) DOUBLE PRECISION array, dimension (NMAX*NMAX)
*          Not referenced inside this routine.
*
*  B       (workspace) DOUBLE PRECISION array, dimension (NMAX*NSMAX)
*          where NSMAX is the largest entry in NSVAL.
*
*  X       (workspace) DOUBLE PRECISION array, dimension (NMAX*NSMAX)
*
*  XACT    (workspace) DOUBLE PRECISION array, dimension (NMAX*NSMAX)
*
*  WORK    (workspace) DOUBLE PRECISION array, dimension
*                      (NMAX*max(3,NSMAX))
*
*  RWORK   (workspace) DOUBLE PRECISION array, dimension
*                      (max(2*NMAX,2*NSMAX+NWORK))
*
*  IWORK   (workspace) INTEGER array, dimension (2*NMAX)
*          Passed to PLASMA_DGETRF and PLASMA_DGETRS (presumably
*          the pivot index array -- confirm against the PLASMA
*          interface).
*
*  NOUT    (input) INTEGER
*          The unit number for output.
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   one, zero
      parameter( one = 1.0d+0, zero = 0.0d+0 )
      INTEGER            ntypes
      parameter( ntypes = 11 )
      INTEGER            ntests
      parameter( ntests = 8 )
*     ONLY NOTRANS SUPPORTED !!!
      INTEGER            ntran
      parameter( ntran = 1 )
*     ..
*     .. Local Scalars ..
      LOGICAL            trfcon, zerot
      CHARACTER          dist, trans, type, xtype
      CHARACTER*3        path
      INTEGER            i, im, imat, ib, in, inb, info, ioff, irhs,
     $                   itran, izero, k, kl, ku, lda, m, mode,
     $                   n, nb, nerrs, nfail, nimat, nrhs, nrun
      DOUBLE PRECISION   anorm, cndnum, rcondc, rcondi, rcondo
*     HL and HPIV are only needed by the disabled INCPIV variant
*     (see the c$$$ lines below).
      INTEGER            hl( 2 ), hpiv( 2 )
      INTEGER            plasma_trans
*     ..
*     .. Local Arrays ..
      CHARACTER          transs( ntran )
      INTEGER            iseed( 4 ), iseedy( 4 ), plasma_transs( ntran )
      DOUBLE PRECISION   result( ntests )
*     ..
*     .. External Subroutines ..
*     Routines called (no EXTERNAL statement, as in the original):
*        ALAERH, ALAHD, ALASUM, DERRGE, DGET02, DGET04, DLACPY,
*        DLARHS, DLASET, DLATB4, DLATMS, XLAENV,
*        PLASMA_SET, PLASMA_DGETRF, PLASMA_DGETRS
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max, min
*     ..
*     .. Scalars in Common ..
      LOGICAL            lerr, ok
      CHARACTER*32       srnamt
      INTEGER            infot, nunit
*     ..
*     .. Common blocks ..
      common             / infoc / infot, nunit, ok, lerr
      common             / srnamc / srnamt
*     ..
*     .. Data statements ..
*     (the LAPACK original used TRANSS / 'N', 'T', 'C' /)
      DATA               iseedy / 1988, 1989, 1990, 1991 / ,
     $                   transs / 'N' /,
     $                   plasma_transs / plasmanotrans /
*     ..
*     .. Executable Statements ..
*
*     Initialize constants and the random number seed.
*     Only the leading 'D' of the literal is stored in PATH(1:1),
*     because the target substring has length one.
*
      path( 1: 1 ) = 'Double precision'
      path( 2: 3 ) = 'GE'
      rcondo = zero
      rcondi = zero
      nrun = 0
      nfail = 0
      nerrs = 0
      DO 10 i = 1, 4
         iseed( i ) = iseedy( i )
   10 continue
*
*     Test the error exits
*
      CALL xlaenv( 1, 1 )
      IF( tsterr )
     $   CALL derrge( path, nout )
      infot = 0
      CALL xlaenv( 2, 2 )
*
*     Do for each value of M in MVAL
*
      DO 120 im = 1, nm
         m = mval( im )
         lda = max( 1, m )
*
*        Do for each value of N in NVAL
*
         DO 110 in = 1, nn
            n = nval( in )
            xtype = 'N'
*
*           Only one matrix type is tried for an empty matrix.
*
            nimat = ntypes
            IF( m.LE.0 .OR. n.LE.0 )
     $         nimat = 1
*
            DO 100 imat = 1, nimat
*
*              Do the tests only if DOTYPE( IMAT ) is true.
*
               IF( .NOT.dotype( imat ) )
     $            go to 100
*
*              Skip types 5, 6, or 7 if the matrix size is too small.
*
               zerot = imat.GE.5 .AND. imat.LE.7
               IF( zerot .AND. n.LT.imat-4 )
     $            go to 100
*
*              Set up parameters with DLATB4 and generate a test matrix
*              with DLATMS.
*
               CALL dlatb4( path, imat, m, n, type, kl, ku, anorm, mode,
     $                      cndnum, dist )
*
               srnamt = 'DLATMS'
               CALL dlatms( m, n, dist, iseed, type, rwork, mode,
     $                      cndnum, anorm, kl, ku, 'No packing', a, lda,
     $                      work, info )
*
*              Check error code from DLATMS.
*
               IF( info.NE.0 ) THEN
                  CALL alaerh( path, 'DLATMS', info, 0, ' ', m, n, -1,
     $                         -1, -1, imat, nfail, nerrs, nout )
                  go to 100
               END IF
*
*              For types 5-7, zero one or more columns of the matrix to
*              test that INFO is returned correctly.  IZERO is the
*              value of INFO expected from the factorization.
*
               IF( zerot ) THEN
                  IF( imat.EQ.5 ) THEN
                     izero = 1
                  ELSE IF( imat.EQ.6 ) THEN
                     izero = min( m, n )
                  ELSE
                     izero = min( m, n ) / 2 + 1
                  END IF
                  ioff = ( izero-1 )*lda
                  IF( imat.LT.7 ) THEN
*
*                    Types 5 and 6: zero column IZERO only.
*
                     DO 20 i = 1, m
                        a( ioff+i ) = zero
   20                continue
                  ELSE
*
*                    Type 7: zero columns IZERO through N.
*
                     CALL dlaset( 'Full', m, n-izero+1, zero, zero,
     $                            a( ioff+1 ), lda )
                  END IF
               ELSE
                  izero = 0
               END IF
*
*              Do for each blocksize in NBVAL
*
               DO 90 inb = 1, nnb
                  nb = nbval( inb )
                  ib = ibval( inb )
                  CALL xlaenv( 1, nb )
*
*                 Skip this tile size when max(M,N)/25 (integer
*                 division) exceeds NB.
*
                  IF ( (max(m, n) / 25) .GT. nb ) THEN
                     goto 90
                  END IF
*
*                 NOTE(review): INFO returned by the two PLASMA_SET
*                 calls is overwritten without being checked.
*
                  CALL plasma_set( plasma_tile_size, nb, info )
                  CALL plasma_set( plasma_inner_block_size, ib, info )
*
*                 ALLOCATE HL and HPIV (disabled INCPIV variant)
*
c$$$                  CALL PLASMA_ALLOC_WORKSPACE_DGETRF_INCPIV(
c$$$     $                 M, N, HL, HPIV, INFO )
*
*                 Compute the LU factorization of the matrix.
*
                  CALL dlacpy( 'Full', m, n, a, lda, afac, lda )
                  srnamt = 'DGETRF'
c$$$                  CALL PLASMA_DGETRF_INCPIV( M, N, AFAC, LDA, HL, HPIV,
c$$$     $                 INFO )
                  CALL plasma_dgetrf( m, n, afac, lda, iwork,
     $                 info )
*
*                 Check error code from DGETRF.
*
                  IF( info.NE.izero )
     $               CALL alaerh( path, 'DGETRF', info, izero, ' ', m,
     $                            n, -1, -1, nb, imat, nfail, nerrs,
     $                            nout )
*
*                 Skip the solve tests if the matrix is not square
*                 or if the factorization returned INFO > 0.
*
                  trfcon = m.NE.n .OR. info.GT.0
                  IF( trfcon )
     $               go to 70
*
                  DO 60 irhs = 1, nns
                     nrhs = nsval( irhs )
                     xtype = 'N'
*
                     DO 50 itran = 1, ntran
                        trans = transs( itran )
                        plasma_trans = plasma_transs( itran )
*
*                       NOTE(review): RCONDO and RCONDI are never
*                       changed from their initial zero in this
*                       routine, so DGET04 always receives
*                       RCONDC = 0.  Confirm whether that leaves
*                       test 4 able to fail.
*
                        IF( itran.EQ.1 ) THEN
                           rcondc = rcondo
                        ELSE
                           rcondc = rcondi
                        END IF
*
*+    TEST 3
*                       Solve and compute residual for A * X = B.
*
                        srnamt = 'DLARHS'
                        CALL dlarhs( path, xtype, ' ', trans, n, n, kl,
     $                               ku, nrhs, a, lda, xact, lda, b,
     $                               lda, iseed, info )
                        xtype = 'C'
*
                        CALL dlacpy( 'Full', n, nrhs, b, lda, x, lda )
                        srnamt = 'DGETRS'
c$$$                        CALL PLASMA_DGETRS_INCPIV( PLASMA_TRANS, N,
c$$$     $                       NRHS, AFAC, LDA, HL, HPIV,
c$$$     $                       X, LDA, INFO )
                        CALL plasma_dgetrs( plasma_trans, n,
     $                       nrhs, afac, lda, iwork,
     $                       x, lda, info )
*
*                       Check error code from DGETRS.
*
                        IF( info.NE.0 )
     $                     CALL alaerh( path, 'DGETRS', info, 0, trans,
     $                                  n, n, -1, -1, nrhs, imat, nfail,
     $                                  nerrs, nout )
*
*                       DGET02 works on a copy of B held in WORK.
*
                        CALL dlacpy( 'Full', n, nrhs, b, lda, work,
     $                               lda )
                        CALL dget02( trans, n, n, nrhs, a, lda, x, lda,
     $                               work, lda, rwork, result( 3 ) )
*
*+    TEST 4
*                       Check solution from generated exact solution.
*
                        CALL dget04( n, nrhs, x, lda, xact, lda, rcondc,
     $                               result( 4 ) )
*
*                       Print information about the tests that did not
*                       pass the threshold.
*
                        DO 40 k = 3, 4
                           IF( result( k ).GE.thresh ) THEN
                              IF( nfail.EQ.0 .AND. nerrs.EQ.0 )
     $                           CALL alahd( nout, path )
                              WRITE( nout, fmt = 9998 )trans, n, nb,
     $                           nrhs, imat, k, result( k )
                              nfail = nfail + 1
                           END IF
   40                   continue
                        nrun = nrun + 2
   50                continue
   60             continue
*
   70             continue
*
*                 DEALLOCATE HL and HPIV (disabled INCPIV variant)
*
c$$$                  CALL PLASMA_DEALLOC_HANDLE( HL, INFO )
c$$$                  CALL PLASMA_DEALLOC_HANDLE( HPIV, INFO )
   90          continue
  100       continue
  110    continue
  120 continue
*
*     Print a summary of the results.
*
      CALL alasum( path, nout, nfail, nrun, nerrs )
*
 9998 format( ' TRANS=''', a1, ''', N =', i5, ', NB =', i4 ,
     $      ', NRHS=', i3, ',type ', i2, ', test(', i2, ') =', g12.5 )
      return
*
*     End of DCHKGE
*
      END