|
libflame
12600
|
Functions | |
| FLA_Error | FLA_Gemm_ch_blk_var5 (FLA_Obj alpha, FLA_Obj A, FLA_Obj B, FLA_Obj beta, FLA_Obj C, fla_gemm_t *cntl) |
FLA_Error FLA_Gemm_ch_blk_var5( FLA_Obj alpha, FLA_Obj A, FLA_Obj B, FLA_Obj beta, FLA_Obj C, fla_gemm_t *cntl )
References FLA_Cont_with_1x3_to_1x2(), FLA_Determine_blocksize(), FLA_Gemm_internal(), FLA_Obj_width(), FLA_ONE, FLA_Part_1x2(), FLA_Repart_1x2_to_1x3(), and FLA_Scal_internal().
Referenced by FLA_Gemm_ch().
{
  /*
   * Blocked gemm variant: walks A and B left to right in matching column
   * panels and accumulates one sub-gemm per panel into C.  A panels are
   * passed as FLA_CONJ_NO_TRANSPOSE, B panels as FLA_CONJ_TRANSPOSE.
   * Sub-operations are dispatched through the control tree `cntl`.
   * Always returns FLA_SUCCESS; results of the internal calls are not
   * inspected here.
   */
  FLA_Obj A_done, A_rest, A_before, A_cur, A_after;
  FLA_Obj B_done, B_rest, B_before, B_cur, B_after;
  dim_t   panel_w;

  /* beta is applied to C exactly once, up front; every sub-gemm below
     therefore accumulates into C with a scaling factor of FLA_ONE. */
  FLA_Scal_internal( beta, C, FLA_Cntl_sub_scal( cntl ) );

  /* Initial 1x2 split of each operand, requested with size 0 on the
     FLA_LEFT side. */
  FLA_Part_1x2( A, &A_done, &A_rest, 0, FLA_LEFT );
  FLA_Part_1x2( B, &B_done, &B_rest, 0, FLA_LEFT );

  for ( ;; )
  {
    /* Finished once the left partition of A is as wide as A itself. */
    if ( !( FLA_Obj_width( A_done ) < FLA_Obj_width( A ) ) )
      break;

    /* Panel width for this step, chosen from what is left of A and the
       blocksize stored in the control tree. */
    panel_w = FLA_Determine_blocksize( A_rest, FLA_RIGHT,
                                       FLA_Cntl_blocksize( cntl ) );

    /* Expose the current panel of A and of B; both use the same width. */
    FLA_Repart_1x2_to_1x3( A_done, A_rest,
                           &A_before, &A_cur, &A_after,
                           panel_w, FLA_RIGHT );
    FLA_Repart_1x2_to_1x3( B_done, B_rest,
                           &B_before, &B_cur, &B_after,
                           panel_w, FLA_RIGHT );

    /* C := alpha * A_cur * B_cur' + C */
    FLA_Gemm_internal( FLA_CONJ_NO_TRANSPOSE, FLA_CONJ_TRANSPOSE,
                       alpha, A_cur, B_cur, FLA_ONE, C,
                       FLA_Cntl_sub_gemm( cntl ) );

    /* Regroup the 1x3 views back into 1x2 form for the next iteration. */
    FLA_Cont_with_1x3_to_1x2( &A_done, &A_rest,
                              A_before, A_cur, A_after,
                              FLA_LEFT );
    FLA_Cont_with_1x3_to_1x2( &B_done, &B_rest,
                              B_before, B_cur, B_after,
                              FLA_LEFT );
  }

  return FLA_SUCCESS;
}
1.7.6.1