26 A = (
float *)malloc( (*m)*
LDA*
sizeof( float ) );
29 A[i*
LDA+j]=a[j*(*lda)+i];
33 A = (
float* )malloc(
LDA*(*k)*
sizeof( float ) );
36 A[i*
LDA+j]=a[j*(*lda)+i];
40 B = (
float* )malloc( (*k)*
LDB*
sizeof( float ) );
43 B[i*
LDB+j]=b[j*(*ldb)+i];
47 B = (
float* )malloc(
LDB*(*n)*
sizeof( float ) );
50 B[i*
LDB+j]=b[j*(*ldb)+i];
53 C = (
float* )malloc( (*m)*LDC*
sizeof( float ) );
56 C[i*LDC+j]=c[j*(*ldc)+i];
58 B,
LDB, *beta, C, LDC );
61 c[j*(*ldc)+i]=C[i*LDC+j];
68 b, *ldb, *beta, c, *ldc );
71 b, *ldb, *beta, c, *ldc );
void cblas_sgemm(CBLAS_LAYOUT layout, CBLAS_TRANSPOSE TransA, CBLAS_TRANSPOSE TransB, const CBLAS_INDEX M, const CBLAS_INDEX N, const CBLAS_INDEX K, const float alpha, const float *A, const CBLAS_INDEX lda, const float *B, const CBLAS_INDEX ldb, const float beta, float *C, const CBLAS_INDEX ldc)
void get_transpose_type(char *type, CBLAS_TRANSPOSE *trans)