xref: /aosp_15_r20/external/cblas/src/cblas_cgemv.c (revision 1858f9982ea1ad57fb52080c08594e4d1cce4fa1)
/*
 * cblas_cgemv.c
 * This program is a C interface to cgemv.
 *
 * Keita Teranishi  5/20/98
 *
 */
8*1858f998SYi Kong #include <stdio.h>
9*1858f998SYi Kong #include <stdlib.h>
10*1858f998SYi Kong #include "cblas.h"
11*1858f998SYi Kong #include "cblas_f77.h"
cblas_cgemv(const enum CBLAS_ORDER order,const enum CBLAS_TRANSPOSE TransA,const int M,const int N,const void * alpha,const void * A,const int lda,const void * X,const int incX,const void * beta,void * Y,const int incY)12*1858f998SYi Kong void cblas_cgemv(const enum CBLAS_ORDER order,
13*1858f998SYi Kong                  const enum CBLAS_TRANSPOSE TransA, const int M, const int N,
14*1858f998SYi Kong                  const void *alpha, const void  *A, const int lda,
15*1858f998SYi Kong                  const void  *X, const int incX, const void *beta,
16*1858f998SYi Kong                  void  *Y, const int incY)
17*1858f998SYi Kong {
18*1858f998SYi Kong    char TA;
19*1858f998SYi Kong #ifdef F77_CHAR
20*1858f998SYi Kong    F77_CHAR F77_TA;
21*1858f998SYi Kong #else
22*1858f998SYi Kong    #define F77_TA &TA
23*1858f998SYi Kong #endif
24*1858f998SYi Kong #ifdef F77_INT
25*1858f998SYi Kong    F77_INT F77_M=M, F77_N=N, F77_lda=lda, F77_incX=incX, F77_incY=incY;
26*1858f998SYi Kong #else
27*1858f998SYi Kong    #define F77_M M
28*1858f998SYi Kong    #define F77_N N
29*1858f998SYi Kong    #define F77_lda lda
30*1858f998SYi Kong    #define F77_incX incx
31*1858f998SYi Kong    #define F77_incY incY
32*1858f998SYi Kong #endif
33*1858f998SYi Kong 
34*1858f998SYi Kong    int n=0, i=0, incx=incX;
35*1858f998SYi Kong    const float *xx= (const float *)X;
36*1858f998SYi Kong    float ALPHA[2],BETA[2];
37*1858f998SYi Kong    int tincY, tincx;
38*1858f998SYi Kong    float *x=(float *)X, *y=(float *)Y, *st=0, *tx=0;
39*1858f998SYi Kong    const float *stx = x;
40*1858f998SYi Kong    extern int CBLAS_CallFromC;
41*1858f998SYi Kong    extern int RowMajorStrg;
42*1858f998SYi Kong    RowMajorStrg = 0;
43*1858f998SYi Kong 
44*1858f998SYi Kong    CBLAS_CallFromC = 1;
45*1858f998SYi Kong 
46*1858f998SYi Kong    if (order == CblasColMajor)
47*1858f998SYi Kong    {
48*1858f998SYi Kong       if (TransA == CblasNoTrans) TA = 'N';
49*1858f998SYi Kong       else if (TransA == CblasTrans) TA = 'T';
50*1858f998SYi Kong       else if (TransA == CblasConjTrans) TA = 'C';
51*1858f998SYi Kong       else
52*1858f998SYi Kong       {
53*1858f998SYi Kong          cblas_xerbla(2, "cblas_cgemv","Illegal TransA setting, %d\n", TransA);
54*1858f998SYi Kong          CBLAS_CallFromC = 0;
55*1858f998SYi Kong          RowMajorStrg = 0;
56*1858f998SYi Kong          return;
57*1858f998SYi Kong       }
58*1858f998SYi Kong       #ifdef F77_CHAR
59*1858f998SYi Kong          F77_TA = C2F_CHAR(&TA);
60*1858f998SYi Kong       #endif
61*1858f998SYi Kong       F77_cgemv(F77_TA, &F77_M, &F77_N, alpha, A, &F77_lda, X, &F77_incX,
62*1858f998SYi Kong                 beta, Y, &F77_incY);
63*1858f998SYi Kong    }
64*1858f998SYi Kong    else if (order == CblasRowMajor)
65*1858f998SYi Kong    {
66*1858f998SYi Kong       RowMajorStrg = 1;
67*1858f998SYi Kong 
68*1858f998SYi Kong       if (TransA == CblasNoTrans) TA = 'T';
69*1858f998SYi Kong       else if (TransA == CblasTrans) TA = 'N';
70*1858f998SYi Kong       else if (TransA == CblasConjTrans)
71*1858f998SYi Kong       {
72*1858f998SYi Kong          ALPHA[0]=    *( (const float *)  alpha    );
73*1858f998SYi Kong          ALPHA[1]= -( *( (const float *)  alpha+1) );
74*1858f998SYi Kong          BETA[0]=     *( (const float *)  beta     );
75*1858f998SYi Kong          BETA[1]= -(  *( (const float *)  beta+1 ) );
76*1858f998SYi Kong          TA = 'N';
77*1858f998SYi Kong          if (M > 0)
78*1858f998SYi Kong          {
79*1858f998SYi Kong             n = M << 1;
80*1858f998SYi Kong             x = malloc(n*sizeof(float));
81*1858f998SYi Kong             tx = x;
82*1858f998SYi Kong             if( incX > 0 ) {
83*1858f998SYi Kong                i = incX << 1 ;
84*1858f998SYi Kong                tincx = 2;
85*1858f998SYi Kong                st= x+n;
86*1858f998SYi Kong             } else {
87*1858f998SYi Kong                i = incX *(-2);
88*1858f998SYi Kong                tincx = -2;
89*1858f998SYi Kong                st = x-2;
90*1858f998SYi Kong                x +=(n-2);
91*1858f998SYi Kong             }
92*1858f998SYi Kong 
93*1858f998SYi Kong             do
94*1858f998SYi Kong             {
95*1858f998SYi Kong                *x = *xx;
96*1858f998SYi Kong                x[1] = -xx[1];
97*1858f998SYi Kong                x += tincx ;
98*1858f998SYi Kong                xx += i;
99*1858f998SYi Kong             }
100*1858f998SYi Kong             while (x != st);
101*1858f998SYi Kong             x=tx;
102*1858f998SYi Kong 
103*1858f998SYi Kong             F77_incX = 1;
104*1858f998SYi Kong 
105*1858f998SYi Kong             if(incY > 0)
106*1858f998SYi Kong                tincY = incY;
107*1858f998SYi Kong             else
108*1858f998SYi Kong                tincY = -incY;
109*1858f998SYi Kong 
110*1858f998SYi Kong             y++;
111*1858f998SYi Kong 
112*1858f998SYi Kong             if (N > 0)
113*1858f998SYi Kong             {
114*1858f998SYi Kong                i = tincY << 1;
115*1858f998SYi Kong                n = i * N ;
116*1858f998SYi Kong                st = y + n;
117*1858f998SYi Kong                do {
118*1858f998SYi Kong                   *y = -(*y);
119*1858f998SYi Kong                   y += i;
120*1858f998SYi Kong                } while(y != st);
121*1858f998SYi Kong                y -= n;
122*1858f998SYi Kong             }
123*1858f998SYi Kong             stx = x;
124*1858f998SYi Kong          }
125*1858f998SYi Kong          else stx = (const float *)X;
126*1858f998SYi Kong       }
127*1858f998SYi Kong       else
128*1858f998SYi Kong       {
129*1858f998SYi Kong          cblas_xerbla(2, "cblas_cgemv","Illegal TransA setting, %d\n", TransA);
130*1858f998SYi Kong          CBLAS_CallFromC = 0;
131*1858f998SYi Kong          RowMajorStrg = 0;
132*1858f998SYi Kong          return;
133*1858f998SYi Kong       }
134*1858f998SYi Kong       #ifdef F77_CHAR
135*1858f998SYi Kong          F77_TA = C2F_CHAR(&TA);
136*1858f998SYi Kong       #endif
137*1858f998SYi Kong       if (TransA == CblasConjTrans)
138*1858f998SYi Kong          F77_cgemv(F77_TA, &F77_N, &F77_M, ALPHA, A, &F77_lda, stx,
139*1858f998SYi Kong                 &F77_incX, BETA, Y, &F77_incY);
140*1858f998SYi Kong       else
141*1858f998SYi Kong          F77_cgemv(F77_TA, &F77_N, &F77_M, alpha, A, &F77_lda, x,
142*1858f998SYi Kong                 &F77_incX, beta, Y, &F77_incY);
143*1858f998SYi Kong 
144*1858f998SYi Kong       if (TransA == CblasConjTrans)
145*1858f998SYi Kong       {
146*1858f998SYi Kong          if (x != (const float *)X) free(x);
147*1858f998SYi Kong          if (N > 0)
148*1858f998SYi Kong          {
149*1858f998SYi Kong             do
150*1858f998SYi Kong             {
151*1858f998SYi Kong                *y = -(*y);
152*1858f998SYi Kong                y += i;
153*1858f998SYi Kong             }
154*1858f998SYi Kong             while (y != st);
155*1858f998SYi Kong          }
156*1858f998SYi Kong       }
157*1858f998SYi Kong    }
158*1858f998SYi Kong    else cblas_xerbla(1, "cblas_cgemv", "Illegal Order setting, %d\n", order);
159*1858f998SYi Kong    CBLAS_CallFromC = 0;
160*1858f998SYi Kong    RowMajorStrg = 0;
161*1858f998SYi Kong    return;
162*1858f998SYi Kong }
163