Parent: [3b207b] (diff)

Child: [28b809] (diff)

Download this file

LibDBlasL3F77.def    103 lines (90 with data), 5.5 kB

  1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
DEFINITION MODULE LibDBlasL3F77;
(*------------------------------------------------------------------------*)
(* Schnittstelle zu Level 3 BLAS FORTRAN77 Subroutinen. *)
(* Interface to level 3 BLAS FORTRAN77 subroutines. *)
(*------------------------------------------------------------------------*)
(* Implementation : Michael Riedl *)
(* Licence : GNU Lesser General Public License (LGPL) *)
(*------------------------------------------------------------------------*)
(* $Id: LibDBlasL3F77.def,v 1.2 2018/09/12 13:20:06 mriedl Exp $ *)
FROM LibDBlasL1F77 IMPORT INTEGER4,REAL4,DOUBLEPRECISION,DOUBLECOMPLEX;
PROCEDURE sgemm( TA : CHAR;
TB : CHAR;
M,N,K : INTEGER4;
Alpha : REAL4;
VAR A : ARRAY OF ARRAY OF REAL4;
lda : INTEGER;
VAR B : ARRAY OF ARRAY OF REAL4;
ldb : INTEGER;
Beta : REAL4;
VAR C : ARRAY OF ARRAY OF REAL4;
ldc : INTEGER);
(*---------------------------------------------------------------*)
(* Call to the Fortran version of the BLAS3 subroutine sgemm *)
(* (single precision general matrix-matrix multiply). *)
(* *)
(* Reference BLAS defines the operation of sgemm as *)
(* C := Alpha*op(A)*op(B) + Beta*C *)
(* where TA and TB select op() for A and B, and M,N,K are the *)
(* dimensions of the matrices taking part in the product. *)
(* *)
(* NOTE(review): the notes on dgemm and zgemm in this module *)
(* state that lda,ldb and ldc are set by the Modula-2 wrapper; *)
(* confirm in the implementation whether this also holds for *)
(* sgemm - it is not visible from this definition module. *)
(*---------------------------------------------------------------*)
PROCEDURE dgemm( TA : CHAR;
TB : CHAR;
M,N,K : INTEGER4;
Alpha : DOUBLEPRECISION;
VAR A : ARRAY OF ARRAY OF DOUBLEPRECISION;
lda : INTEGER;
VAR B : ARRAY OF ARRAY OF DOUBLEPRECISION;
ldb : INTEGER;
Beta : DOUBLEPRECISION;
VAR C : ARRAY OF ARRAY OF DOUBLEPRECISION;
ldc : INTEGER);
(*---------------------------------------------------------------*)
(* Call to the Fortran version of the BLAS3 subroutine dgemm *)
(* (double precision general matrix-matrix multiply). *)
(* *)
(* Reference BLAS defines the operation of dgemm as *)
(* C := Alpha*op(A)*op(B) + Beta*C *)
(* where TA and TB select op() for A and B. *)
(* *)
(* Please note that lda,ldb and ldc are meaningless here as they *)
(* will be set automatically within the Modula-2 wrapper routine *)
(* which also takes care that the caller does not need to worry *)
(* about the column major memory model used in Fortran. *)
(*---------------------------------------------------------------*)
PROCEDURE dgemmOMP( TA : CHAR;
TB : CHAR;
M,N,K : INTEGER4;
Alpha : DOUBLEPRECISION;
VAR A : ARRAY OF ARRAY OF DOUBLEPRECISION;
lda : INTEGER;
VAR B : ARRAY OF ARRAY OF DOUBLEPRECISION;
ldb : INTEGER;
Beta : DOUBLEPRECISION;
VAR C : ARRAY OF ARRAY OF DOUBLEPRECISION;
ldc : INTEGER);
(*---------------------------------------------------------------*)
(* Call to the Fortran version of the BLAS3 subroutine dgemm in *)
(* the OpenMP parallelised version. The parameter list is the *)
(* same as that of dgemm. *)
(* *)
(* dgemmOMP is far from being optimal - please test whether it *)
(* really improves the performance in your specific *)
(* environment. On 32 bit systems the communication overhead *)
(* outweighs the potential gain in speed from using more than *)
(* one thread in many cases. But even on an outdated Atom single *)
(* core processor a two thread version was about 40 % quicker *)
(* than the single thread version. So you need to test ... *)
(* Also do not make the physical size of A,B and C much bigger *)
(* than needed - that will slow things down as well. *)
(*---------------------------------------------------------------*)
PROCEDURE zgemm( TA : CHAR;
TB : CHAR;
M,N,K : INTEGER4;
Alpha : DOUBLECOMPLEX;
VAR A : ARRAY OF ARRAY OF DOUBLECOMPLEX;
lda : INTEGER;
VAR B : ARRAY OF ARRAY OF DOUBLECOMPLEX;
ldb : INTEGER;
Beta : DOUBLECOMPLEX;
VAR C : ARRAY OF ARRAY OF DOUBLECOMPLEX;
ldc : INTEGER);
(*---------------------------------------------------------------*)
(* Call to the Fortran version of the BLAS3 subroutine zgemm *)
(* (double precision complex general matrix-matrix multiply). *)
(* *)
(* Reference BLAS defines the operation of zgemm as *)
(* C := Alpha*op(A)*op(B) + Beta*C *)
(* where TA and TB select op() for A and B. *)
(* *)
(* Please note that lda,ldb and ldc are meaningless here as they *)
(* will be set automatically within the Modula-2 wrapper routine *)
(* which also takes care that the caller does not need to worry *)
(* about the column major memory model used in Fortran. *)
(*---------------------------------------------------------------*)
END LibDBlasL3F77.