18 {
19
20 float *A, *B, *C;
23
26
29 LDA = *k+1;
30 A = (float *)malloc( (*m)*LDA*sizeof( float ) );
31 for( i=0; i<*m; i++ )
32 for( j=0; j<*k; j++ )
33 A[i*LDA+j]=a[j*(*lda)+i];
34 }
35 else {
36 LDA = *m+1;
37 A = ( float* )malloc( LDA*(*k)*sizeof( float ) );
38 for( i=0; i<*k; i++ )
39 for( j=0; j<*m; j++ )
40 A[i*LDA+j]=a[j*(*lda)+i];
41 }
43 LDB = *n+1;
44 B = ( float* )malloc( (*k)*LDB*sizeof( float ) );
45 for( i=0; i<*k; i++ )
46 for( j=0; j<*n; j++ )
47 B[i*LDB+j]=b[j*(*ldb)+i];
48 }
49 else {
50 LDB = *k+1;
51 B = ( float* )malloc( LDB*(*n)*sizeof( float ) );
52 for( i=0; i<*n; i++ )
53 for( j=0; j<*k; j++ )
54 B[i*LDB+j]=b[j*(*ldb)+i];
55 }
56 LDC = *n+1;
57 C = ( float* )malloc( (*m)*LDC*sizeof( float ) );
58 for( j=0; j<*n; j++ )
59 for( i=0; i<*m; i++ )
60 C[i*LDC+j]=c[j*(*ldc)+i];
62 B, LDB, *beta, C, LDC );
63 for( j=0; j<*n; j++ )
64 for( i=0; i<*m; i++ )
65 c[j*(*ldc)+i]=C[i*LDC+j];
66 free(A);
67 free(B);
68 free(C);
69 }
72 b, *ldb, *beta, c, *ldc );
73 else
75 b, *ldb, *beta, c, *ldc );
76}
void cblas_sgemm(CBLAS_LAYOUT layout, CBLAS_TRANSPOSE TransA, CBLAS_TRANSPOSE TransB, const CBLAS_INT M, const CBLAS_INT N, const CBLAS_INT K, const float alpha, const float *A, const CBLAS_INT lda, const float *B, const CBLAS_INT ldb, const float beta, float *C, const CBLAS_INT ldc)
void get_transpose_type(char *type, CBLAS_TRANSPOSE *trans)