Cache Blocking
Untuned
! Untuned reference kernel: accumulates the matrix product A*B into C,
! i.e. C(I,J) = C(I,J) + sum over K of A(I,K)*B(K,J).
! NOTE(review): the extents M, N, P and the initial contents of C are
! not set in this fragment -- presumably provided by the enclosing
! program unit; confirm before reuse.
      REAL*8 A(M,N)
      REAL*8 B(N,P)
      REAL*8 C(M,P)
      DO J=1,P
        DO I=1,M
!         K runs innermost, so successive reads of A(I,K) are M
!         elements apart (Fortran arrays are stored column-major).
          DO K=1,N
!           Row I of A times column J of B contributes to C(I,J).
            C(I,J) = C(I,J) + A(I,K)*B(K,J)
          ENDDO
        ENDDO
      ENDDO
Tuned
! Cache-blocked form of the product C = C + A*B: the J, I and K index
! ranges are cut into tiles of 16, and the three inner loops sweep one
! tile combination at a time.
! For any fixed (I,J) the K contributions are still added in increasing
! K order, the same order a plain J/I/K triple loop uses.
      DO JB=1,P,16
        DO IB=1,M,16
          DO KB=1,N,16
!           MIN clamps the last (possibly partial) tile to the extent.
            DO J=JB,MIN(P,JB+15)
              DO I=IB,MIN(M,IB+15)
                DO K=KB,MIN(N,KB+15)
                  C(I,J) = C(I,J) + A(I,K)*B(K,J)
                ENDDO
              ENDDO
            ENDDO
          ENDDO
        ENDDO
      ENDDO
Previous slide
Next slide
Back to first slide
View graphic version