*     plasma/docs/ddrvge_8f_source.html

      SUBROUTINE ddrvge( DOTYPE, NN, NVAL, NRHS, THRESH, TSTERR, NMAX,
     $                   a, afac, asav, b, bsav, x, xact, s, work,
     $                   rwork, iwork, nout )
*
      include 'plasmaf.h'
*
*  -- LAPACK test routine (version 3.1) --
*     Univ. of Tennessee, Univ. of California Berkeley and NAG Ltd..
*     November 2006
*
*     .. Scalar Arguments ..
      LOGICAL            tsterr
      INTEGER            nmax, nn, nout, nrhs
      DOUBLE PRECISION   thresh
*     ..
*     .. Array Arguments ..
      LOGICAL            dotype( * )
      INTEGER            iwork( * ), nval( * )
      DOUBLE PRECISION   a( * ), afac( * ), asav( * ), b( * ),
     $                   bsav( * ), rwork( * ), s( * ), work( * ),
     $                   x( * ), xact( * )
*     ..
*
*  Purpose
*  =======
*
*  DDRVGE tests the linear system driver PLASMA_DGESV (reported under
*  the name DGESV).  No DGESVX call is made by this routine.
*
*  For every N in NVAL and every enabled matrix type a test matrix is
*  generated with DLATMS, a right hand side is built with DLARHS, the
*  system is solved with PLASMA_DGESV and two test ratios are formed:
*     RESULT( 1 )  residual of the computed solution (DGET02)
*     RESULT( 2 )  comparison with the generated solution (DGET04)
*  The ratios are only formed for non-singular matrix types.
*
*  Arguments
*  =========
*
*  DOTYPE  (input) LOGICAL array, dimension (NTYPES)
*          The matrix types to be used for testing.  Matrices of type j
*          (for 1 <= j <= NTYPES) are used for testing if DOTYPE(j) =
*          .TRUE.; if DOTYPE(j) = .FALSE., then type j is not used.
*
*  NN      (input) INTEGER
*          The number of values of N contained in the vector NVAL.
*
*  NVAL    (input) INTEGER array, dimension (NN)
*          The values of the matrix column dimension N.
*
*  NRHS    (input) INTEGER
*          The number of right hand side vectors to be generated for
*          each linear system.
*
*  THRESH  (input) DOUBLE PRECISION
*          The threshold value for the test ratios.  A result is
*          included in the output file if RESULT >= THRESH.  To have
*          every test ratio printed, use THRESH = 0.
*
*  TSTERR  (input) LOGICAL
*          Flag that indicates whether error exits are to be tested.
*
*  NMAX    (input) INTEGER
*          The maximum value permitted for N, used in dimensioning the
*          work arrays.
*
*  A       (workspace) DOUBLE PRECISION array, dimension (NMAX*NMAX)
*
*  AFAC    (workspace) DOUBLE PRECISION array, dimension (NMAX*NMAX)
*
*  ASAV    (workspace) DOUBLE PRECISION array, dimension (NMAX*NMAX)
*
*  B       (workspace) DOUBLE PRECISION array, dimension (NMAX*NRHS)
*
*  BSAV    (workspace) DOUBLE PRECISION array, dimension (NMAX*NRHS)
*
*  X       (workspace) DOUBLE PRECISION array, dimension (NMAX*NRHS)
*
*  XACT    (workspace) DOUBLE PRECISION array, dimension (NMAX*NRHS)
*
*  S       (workspace) DOUBLE PRECISION array, dimension (2*NMAX)
*
*  WORK    (workspace) DOUBLE PRECISION array, dimension
*                      (NMAX*max(3,NRHS))
*
*  RWORK   (workspace) DOUBLE PRECISION array, dimension (2*NRHS+NMAX)
*
*  IWORK   (workspace) INTEGER array, dimension (2*NMAX)
*          Passed as the pivot array to PLASMA_DGETRF and PLASMA_DGESV.
*
*  NOUT    (input) INTEGER
*          The unit number for output.
*
*  =====================================================================
*
*     .. Parameters ..
      DOUBLE PRECISION   one, zero
      parameter( one = 1.0d+0, zero = 0.0d+0 )
      INTEGER            ntypes
      parameter( ntypes = 11 )
      INTEGER            ntests
      parameter( ntests = 7 )
*     ONLY NOTRANS SUPPORTED !!!
      INTEGER            ntran
      parameter( ntran = 1 )
*     ..
*     .. Local Scalars ..
      LOGICAL            equil, nofact, prefac, zerot
      CHARACTER          dist, equed, fact, trans, type, xtype
      CHARACTER*3        path
      INTEGER            i, iequed, ifact, imat, in, info, ioff, itran,
     $                   izero, k, kl, ku, lda, mode, n, nb,
     $                   nbmin, nerrs, nfact, nfail, nimat, nrun, nt, ib
*     HL and HPIV are only referenced by the disabled (c$$$) INCPIV
*     calls below; they are kept so those calls can be re-enabled.
      INTEGER            hl( 2 ), hpiv( 2 )
      INTEGER            plasma_trans
      DOUBLE PRECISION   amax, anorm, anormi, anormo, cndnum,
     $                   colcnd, rcondc, rcondi, rcondo,
     $                   roldi, roldo, rowcnd
*     ..
*     .. Local Arrays ..
      CHARACTER          equeds( 4 ), facts( 3 ), transs( ntran )
      INTEGER            iseed( 4 ), iseedy( 4 ), plasma_transs( ntran )
      DOUBLE PRECISION   result( ntests )
*     ..
*     .. External Functions ..
      LOGICAL            lsame
      DOUBLE PRECISION   dlange
      EXTERNAL           lsame, dlange
*     ..
*     .. External Subroutines ..
      EXTERNAL           aladhd, alaerh, alasvm, derrvx, dgeequ,
     $                   dget02, dget04, dlacpy, dlaqge, dlarhs,
     $                   dlaset, dlatb4, dlatms, xlaenv
*     ..
*     .. Intrinsic Functions ..
      INTRINSIC          max
*     ..
*     .. Scalars in Common ..
      LOGICAL            lerr, ok
      CHARACTER*32       srnamt
      INTEGER            infot, nunit
*     ..
*     .. Common blocks ..
      common             / infoc / infot, nunit, ok, lerr
      common             / srnamc / srnamt
*     ..
*     .. Data statements ..
      DATA               iseedy / 1988, 1989, 1990, 1991 /
*      DATA               TRANSS / 'N', 'T', 'C' /
      DATA               transs / 'N' /
      DATA               plasma_transs / plasmanotrans /
      DATA               facts / 'F', 'N', 'E' /
      DATA               equeds / 'N', 'R', 'C', 'B' /
*     ..
*     .. Executable Statements ..
*
*     Initialize constants and the random number seed.  PATH is
*     CHARACTER*3, so only the leading 'D' of the long literal is
*     stored in PATH( 1: 1 ); the resulting path name is 'DGE'.
*
      path( 1: 1 ) = 'Double precision'
      path( 2: 3 ) = 'GE'
      rcondo = zero
      rcondi = zero
      nrun = 0
      nfail = 0
      nerrs = 0
      DO 10 i = 1, 4
         iseed( i ) = iseedy( i )
   10 continue
*
*     Test the error exits
*
      IF( tsterr )
     $   CALL derrvx( path, nout )
      infot = 0
*
*     Set the block size and minimum block size for testing.  The same
*     NB is given to PLASMA as tile size, IB as inner block size.
*
      nb = 128
      ib = 32
      nbmin = 32
      CALL xlaenv( 1, nb )
      CALL xlaenv( 2, nbmin )
      CALL plasma_set( plasma_tile_size, nb, info )
      CALL plasma_set( plasma_inner_block_size, ib, info )
*
*     Do for each value of N in NVAL
*
      DO 90 in = 1, nn
         n = nval( in )
         lda = max( n, 1 )
         xtype = 'N'
         nimat = ntypes
         IF( n.LE.0 )
     $      nimat = 1
*
*        ALLOCATE L and IPIV
*
c$$$         CALL PLASMA_ALLOC_WORKSPACE_DGETRF_INCPIV(
c$$$     $        N, N, HL, HPIV, INFO )
*
         DO 80 imat = 1, nimat
*
*           Do the tests only if DOTYPE( IMAT ) is true.
*
            IF( .NOT.dotype( imat ) )
     $         go to 80
*
*           Skip types 5, 6, or 7 if the matrix size is too small.
*
            zerot = imat.GE.5 .AND. imat.LE.7
            IF( zerot .AND. n.LT.imat-4 )
     $         go to 80
*
*           Set up parameters with DLATB4 and generate a test matrix
*           with DLATMS.
*
            CALL dlatb4( path, imat, n, n, type, kl, ku, anorm, mode,
     $                   cndnum, dist )
            rcondc = one / cndnum
*
            srnamt = 'DLATMS'
            CALL dlatms( n, n, dist, iseed, type, rwork, mode, cndnum,
     $                   anorm, kl, ku, 'No packing', a, lda, work,
     $                   info )
*
*           Check error code from DLATMS.
*
            IF( info.NE.0 ) THEN
               CALL alaerh( path, 'DLATMS', info, 0, ' ', n, n, -1, -1,
     $                      -1, imat, nfail, nerrs, nout )
               go to 80
            END IF
*
*           For types 5-7, zero one or more columns of the matrix to
*           test that INFO is returned correctly.  IZERO is the index
*           of the first zeroed column (0 when nothing is zeroed).
*
            IF( zerot ) THEN
               IF( imat.EQ.5 ) THEN
                  izero = 1
               ELSE IF( imat.EQ.6 ) THEN
                  izero = n
               ELSE
                  izero = n / 2 + 1
               END IF
               ioff = ( izero-1 )*lda
               IF( imat.LT.7 ) THEN
*
*                 Types 5 and 6: zero the single column IZERO.
*
                  DO 20 i = 1, n
                     a( ioff+i ) = zero
   20             continue
               ELSE
*
*                 Type 7: zero columns IZERO through N.
*
                  CALL dlaset( 'Full', n, n-izero+1, zero, zero,
     $                         a( ioff+1 ), lda )
               END IF
            ELSE
               izero = 0
            END IF
*
*           Save a copy of the matrix A in ASAV.
*
            CALL dlacpy( 'Full', n, n, a, lda, asav, lda )
*
            DO 70 iequed = 1, 4
               equed = equeds( iequed )
*
*              All three FACT values are tried only for EQUED = 'N'.
*
               IF( iequed.EQ.1 ) THEN
                  nfact = 3
               ELSE
                  nfact = 1
               END IF
*
               DO 60 ifact = 1, nfact
                  fact = facts( ifact )
                  prefac = lsame( fact, 'F' )
                  nofact = lsame( fact, 'N' )
                  equil = lsame( fact, 'E' )
*
                  IF( zerot ) THEN
                     IF( prefac )
     $                  go to 60
                     rcondo = zero
                     rcondi = zero
*
                  ELSE IF( .NOT.nofact ) THEN
*
*                    Equilibrate (when requested) and factor a copy of
*                    the saved matrix in AFAC.
*
*                    NOTE: no inverse is formed in this version, so
*                    RCONDO and RCONDI are never updated and keep the
*                    value ZERO; ANORMO and ANORMI are computed but
*                    not used afterwards.
*
                     CALL dlacpy( 'Full', n, n, asav, lda, afac, lda )
                     IF( equil .OR. iequed.GT.1 ) THEN
*
*                       Compute row and column scale factors to
*                       equilibrate the matrix A.
*
                        CALL dgeequ( n, n, afac, lda, s, s( n+1 ),
     $                               rowcnd, colcnd, amax, info )
                        IF( info.EQ.0 .AND. n.GT.0 ) THEN
*
*                          Overwrite ROWCND/COLCND so that DLAQGE is
*                          given ZERO for each scaling named by EQUED.
*
                           IF( lsame( equed, 'R' ) ) THEN
                              rowcnd = zero
                              colcnd = one
                           ELSE IF( lsame( equed, 'C' ) ) THEN
                              rowcnd = one
                              colcnd = zero
                           ELSE IF( lsame( equed, 'B' ) ) THEN
                              rowcnd = zero
                              colcnd = zero
                           END IF
*
*                          Equilibrate the matrix.
*
                           CALL dlaqge( n, n, afac, lda, s, s( n+1 ),
     $                                  rowcnd, colcnd, amax, equed )
                        END IF
                     END IF
*
*                    Save the condition number of the non-equilibrated
*                    system (ROLDO and ROLDI are not read afterwards
*                    in this routine).
*
                     IF( equil ) THEN
                        roldo = rcondo
                        roldi = rcondi
                     END IF
*
*                    Compute the 1-norm and infinity-norm of A.
*
                     anormo = dlange( '1', n, n, afac, lda, rwork )
                     anormi = dlange( 'I', n, n, afac, lda, rwork )
*
*                    Factor the matrix A.
*
c$$$                     CALL PLASMA_DGETRF_INCPIV( N, N, AFAC, LDA,
c$$$     $                                   HL, HPIV, INFO )
                     CALL plasma_dgetrf( n, n, afac, lda,
     $                                   iwork, info )
                  END IF
*
                  DO 50 itran = 1, ntran
*
*                    Do for each value of TRANS.
*
                     trans = transs( itran )
                     plasma_trans = plasma_transs( itran )
                     IF( itran.EQ.1 ) THEN
                        rcondc = rcondo
                     ELSE
                        rcondc = rcondi
                     END IF
*
*                    Restore the matrix A.
*
                     CALL dlacpy( 'Full', n, n, asav, lda, a, lda )
*
*                    Form an exact solution and set the right hand side.
*
                     srnamt = 'DLARHS'
                     CALL dlarhs( path, xtype, 'Full', trans, n, n, kl,
     $                            ku, nrhs, a, lda, xact, lda, b, lda,
     $                            iseed, info )
                     xtype = 'C'
                     CALL dlacpy( 'Full', n, nrhs, b, lda, bsav, lda )
*
                     IF( nofact .AND. itran.EQ.1 ) THEN
*
*                       --- Test DGESV  ---
*
*                       Compute the LU factorization of the matrix and
*                       solve the system.
*
                        CALL dlacpy( 'Full', n, n, a, lda, afac, lda )
                        CALL dlacpy( 'Full', n, nrhs, b, lda, x, lda )
*
                        srnamt = 'DGESV '
c$$$                        CALL PLASMA_DGESV_INCPIV( N, NRHS, AFAC, LDA,
c$$$     $                       HL, HPIV, X, LDA, INFO )
                        CALL plasma_dgesv( n, nrhs, afac, lda,
     $                       iwork, x, lda, info )
*
*                       Check error code from DGESV .
*
                        IF( info.NE.izero )
     $                     CALL alaerh( path, 'DGESV ', info, izero,
     $                                  ' ', n, n, -1, -1, nrhs, imat,
     $                                  nfail, nerrs, nout )
*
*                       NT is the number of test ratios formed for
*                       this case.  It must be reset here: for the
*                       singular types (IZERO > 0) no ratio is
*                       computed, and a stale or undefined NT would
*                       make the loop below report old RESULT values
*                       and inflate NRUN.
*
                        nt = 0
                        IF( izero.EQ.0 ) THEN
*
*                          Compute residual of the computed solution.
*
                           CALL dlacpy( 'Full', n, nrhs, b, lda, work,
     $                                  lda )
                           CALL dget02( 'No transpose', n, n, nrhs, a,
     $                                  lda, x, lda, work, lda, rwork,
     $                                  result( 1 ) )
*
*                          Check solution from generated exact solution.
*                          RCONDC equals RCONDO here, which is ZERO in
*                          this version (see the note above).
*
                           CALL dget04( n, nrhs, x, lda, xact, lda,
     $                                  rcondc, result( 2 ) )
                           nt = 2
                        END IF
*
*                       Print information about the tests that did not
*                       pass the threshold.
*
*                       NOTE(review): format 9999 labels its second
*                       integer 'NB=' but the value written is IB;
*                       confirm which of the two is intended.
*
                        DO 30 k = 1, nt
                           IF( result( k ).GE.thresh ) THEN
                              IF( nfail.EQ.0 .AND. nerrs.EQ.0 )
     $                           CALL aladhd( nout, path )
                              WRITE( nout, fmt = 9999 )'DGESV ', n, ib,
     $                           imat, k, result( k )
                              nfail = nfail + 1
                           END IF
   30                   continue
                        nrun = nrun + nt
                     END IF
   50             continue
   60          continue
   70       continue
   80    continue
*
*        DEALLOCATE HL and HPIV
*
c$$$         CALL PLASMA_DEALLOC_HANDLE( HL, INFO )
c$$$         CALL PLASMA_DEALLOC_HANDLE( HPIV, INFO )
   90 continue
*
*     Print a summary of the results.
*
      CALL alasvm( path, nout, nfail, nrun, nerrs )
*
 9999 format( 1x, a, ', N =', i5,', NB=', i5, ', type ', i2,
     $      ', test(', i2, ') =', g12.5 )
      return
*
*     End of DDRVGE
*
      END