/*
 *
 * cblas_sgemm.c
 * This program is a C interface to sgemm.
 * Written by Keita Teranishi
 * 4/8/1998
 *
 */
9*1858f998SYi Kong
10*1858f998SYi Kong #include "cblas.h"
11*1858f998SYi Kong #include "cblas_f77.h"
cblas_sgemm(const enum CBLAS_ORDER Order,const enum CBLAS_TRANSPOSE TransA,const enum CBLAS_TRANSPOSE TransB,const int M,const int N,const int K,const float alpha,const float * A,const int lda,const float * B,const int ldb,const float beta,float * C,const int ldc)12*1858f998SYi Kong void cblas_sgemm(const enum CBLAS_ORDER Order, const enum CBLAS_TRANSPOSE TransA,
13*1858f998SYi Kong const enum CBLAS_TRANSPOSE TransB, const int M, const int N,
14*1858f998SYi Kong const int K, const float alpha, const float *A,
15*1858f998SYi Kong const int lda, const float *B, const int ldb,
16*1858f998SYi Kong const float beta, float *C, const int ldc)
17*1858f998SYi Kong {
18*1858f998SYi Kong char TA, TB;
19*1858f998SYi Kong #ifdef F77_CHAR
20*1858f998SYi Kong F77_CHAR F77_TA, F77_TB;
21*1858f998SYi Kong #else
22*1858f998SYi Kong #define F77_TA &TA
23*1858f998SYi Kong #define F77_TB &TB
24*1858f998SYi Kong #endif
25*1858f998SYi Kong
26*1858f998SYi Kong #ifdef F77_INT
27*1858f998SYi Kong F77_INT F77_M=M, F77_N=N, F77_K=K, F77_lda=lda, F77_ldb=ldb;
28*1858f998SYi Kong F77_INT F77_ldc=ldc;
29*1858f998SYi Kong #else
30*1858f998SYi Kong #define F77_M M
31*1858f998SYi Kong #define F77_N N
32*1858f998SYi Kong #define F77_K K
33*1858f998SYi Kong #define F77_lda lda
34*1858f998SYi Kong #define F77_ldb ldb
35*1858f998SYi Kong #define F77_ldc ldc
36*1858f998SYi Kong #endif
37*1858f998SYi Kong
38*1858f998SYi Kong extern int CBLAS_CallFromC;
39*1858f998SYi Kong extern int RowMajorStrg;
40*1858f998SYi Kong RowMajorStrg = 0;
41*1858f998SYi Kong CBLAS_CallFromC = 1;
42*1858f998SYi Kong if( Order == CblasColMajor )
43*1858f998SYi Kong {
44*1858f998SYi Kong if(TransA == CblasTrans) TA='T';
45*1858f998SYi Kong else if ( TransA == CblasConjTrans ) TA='C';
46*1858f998SYi Kong else if ( TransA == CblasNoTrans ) TA='N';
47*1858f998SYi Kong else
48*1858f998SYi Kong {
49*1858f998SYi Kong cblas_xerbla(2, "cblas_sgemm",
50*1858f998SYi Kong "Illegal TransA setting, %d\n", TransA);
51*1858f998SYi Kong CBLAS_CallFromC = 0;
52*1858f998SYi Kong RowMajorStrg = 0;
53*1858f998SYi Kong return;
54*1858f998SYi Kong }
55*1858f998SYi Kong
56*1858f998SYi Kong if(TransB == CblasTrans) TB='T';
57*1858f998SYi Kong else if ( TransB == CblasConjTrans ) TB='C';
58*1858f998SYi Kong else if ( TransB == CblasNoTrans ) TB='N';
59*1858f998SYi Kong else
60*1858f998SYi Kong {
61*1858f998SYi Kong cblas_xerbla(3, "cblas_sgemm",
62*1858f998SYi Kong "Illegal TransB setting, %d\n", TransB);
63*1858f998SYi Kong CBLAS_CallFromC = 0;
64*1858f998SYi Kong RowMajorStrg = 0;
65*1858f998SYi Kong return;
66*1858f998SYi Kong }
67*1858f998SYi Kong
68*1858f998SYi Kong #ifdef F77_CHAR
69*1858f998SYi Kong F77_TA = C2F_CHAR(&TA);
70*1858f998SYi Kong F77_TB = C2F_CHAR(&TB);
71*1858f998SYi Kong #endif
72*1858f998SYi Kong
73*1858f998SYi Kong F77_sgemm(F77_TA, F77_TB, &F77_M, &F77_N, &F77_K, &alpha, A, &F77_lda, B, &F77_ldb, &beta, C, &F77_ldc);
74*1858f998SYi Kong } else if (Order == CblasRowMajor)
75*1858f998SYi Kong {
76*1858f998SYi Kong RowMajorStrg = 1;
77*1858f998SYi Kong if(TransA == CblasTrans) TB='T';
78*1858f998SYi Kong else if ( TransA == CblasConjTrans ) TB='C';
79*1858f998SYi Kong else if ( TransA == CblasNoTrans ) TB='N';
80*1858f998SYi Kong else
81*1858f998SYi Kong {
82*1858f998SYi Kong cblas_xerbla(2, "cblas_sgemm",
83*1858f998SYi Kong "Illegal TransA setting, %d\n", TransA);
84*1858f998SYi Kong CBLAS_CallFromC = 0;
85*1858f998SYi Kong RowMajorStrg = 0;
86*1858f998SYi Kong return;
87*1858f998SYi Kong }
88*1858f998SYi Kong if(TransB == CblasTrans) TA='T';
89*1858f998SYi Kong else if ( TransB == CblasConjTrans ) TA='C';
90*1858f998SYi Kong else if ( TransB == CblasNoTrans ) TA='N';
91*1858f998SYi Kong else
92*1858f998SYi Kong {
93*1858f998SYi Kong cblas_xerbla(2, "cblas_sgemm",
94*1858f998SYi Kong "Illegal TransA setting, %d\n", TransA);
95*1858f998SYi Kong CBLAS_CallFromC = 0;
96*1858f998SYi Kong RowMajorStrg = 0;
97*1858f998SYi Kong return;
98*1858f998SYi Kong }
99*1858f998SYi Kong #ifdef F77_CHAR
100*1858f998SYi Kong F77_TA = C2F_CHAR(&TA);
101*1858f998SYi Kong F77_TB = C2F_CHAR(&TB);
102*1858f998SYi Kong #endif
103*1858f998SYi Kong
104*1858f998SYi Kong F77_sgemm(F77_TA, F77_TB, &F77_N, &F77_M, &F77_K, &alpha, B, &F77_ldb, A, &F77_lda, &beta, C, &F77_ldc);
105*1858f998SYi Kong } else
106*1858f998SYi Kong cblas_xerbla(1, "cblas_sgemm",
107*1858f998SYi Kong "Illegal Order setting, %d\n", Order);
108*1858f998SYi Kong CBLAS_CallFromC = 0;
109*1858f998SYi Kong RowMajorStrg = 0;
110*1858f998SYi Kong }
111