libflame  revision_anchor
Functions
FLA_Gemm_tn_unb_var6.c File Reference

(r)

Functions

FLA_Error FLA_Gemm_tn_unb_var6 (FLA_Obj alpha, FLA_Obj A, FLA_Obj B, FLA_Obj beta, FLA_Obj C)
 

Function Documentation

◆ FLA_Gemm_tn_unb_var6()

FLA_Error FLA_Gemm_tn_unb_var6 ( FLA_Obj  alpha,
FLA_Obj  A,
FLA_Obj  B,
FLA_Obj  beta,
FLA_Obj  C 
)

References FLA_Cont_with_3x1_to_2x1(), FLA_Ger_external(), FLA_Obj_length(), FLA_Part_2x1(), FLA_Repart_2x1_to_3x1(), and FLA_Scal_external().

Referenced by FLA_Gemm_tn().

16 { /* Calls FLA_Scal_external( beta, C ) once, then issues one FLA_Ger_external update of C per loop iteration. */
17  FLA_Obj AT, A0, /* AT/AB: 2x1 partition of A; A0/a1t/A2: its 3x1 repartition */
18  AB, a1t,
19  A2;
20 
21  FLA_Obj BT, B0, /* BT/BB: 2x1 partition of B; B0/b1t/B2: its 3x1 repartition */
22  BB, b1t,
23  B2;
24 
25  FLA_Scal_external( beta, C ); /* presumably C := beta * C, applied before any update -- confirm against FLA_Scal_external */
26 
27  FLA_Part_2x1( A, &AT,
28  &AB, 0, FLA_BOTTOM ); /* mb = 0 on the FLA_BOTTOM side: AB presumably starts with no rows -- confirm */
29 
30  FLA_Part_2x1( B, &BT,
31  &BB, 0, FLA_BOTTOM ); /* B is partitioned with the same arguments as A */
32 
33  while ( FLA_Obj_length( AB ) < FLA_Obj_length( A ) ){ /* iterate until AB is as long as A */
34 
35  FLA_Repart_2x1_to_3x1( AT, &A0,
36  &a1t,
37  /* ** */ /* *** */
38  AB, &A2, 1, FLA_TOP ); /* mb = 1, FLA_TOP: presumably exposes a single row a1t taken from AT -- confirm */
39 
40  FLA_Repart_2x1_to_3x1( BT, &B0,
41  &b1t,
42  /* ** */ /* *** */
43  BB, &B2, 1, FLA_TOP ); /* same repartitioning applied to B, exposing b1t */
44 
45  /*------------------------------------------------------------*/
46 
47  /* C = alpha * a1t' * b1t + C  (alpha is passed to FLA_Ger_external below) */
48  FLA_Ger_external( alpha, a1t, b1t, C );
49 
50  /*------------------------------------------------------------*/
51 
52  FLA_Cont_with_3x1_to_2x1( &AT, A0,
53  /* ** */ /* *** */
54  a1t,
55  &AB, A2, FLA_BOTTOM ); /* FLA_BOTTOM: presumably a1t is merged into AB, growing it toward the loop bound -- confirm */
56 
57  FLA_Cont_with_3x1_to_2x1( &BT, B0,
58  /* ** */ /* *** */
59  b1t,
60  &BB, B2, FLA_BOTTOM ); /* same merge applied to the B partition */
61 
62  }
63 
64  return FLA_SUCCESS; /* unconditional: the FLA_Error results of the calls above are not inspected */
65 }
FLA_Error FLA_Repart_2x1_to_3x1(FLA_Obj AT, FLA_Obj *A0, FLA_Obj *A1, FLA_Obj AB, FLA_Obj *A2, dim_t mb, FLA_Side side)
Definition: FLA_View.c:226
FLA_Error FLA_Scal_external(FLA_Obj alpha, FLA_Obj A)
Definition: FLA_Scal_external.c:13
FLA_Error FLA_Cont_with_3x1_to_2x1(FLA_Obj *AT, FLA_Obj A0, FLA_Obj A1, FLA_Obj *AB, FLA_Obj A2, FLA_Side side)
Definition: FLA_View.c:428
Definition: FLA_type_defs.h:158
FLA_Error FLA_Part_2x1(FLA_Obj A, FLA_Obj *A1, FLA_Obj *A2, dim_t mb, FLA_Side side)
Definition: FLA_View.c:76
FLA_Error FLA_Ger_external(FLA_Obj alpha, FLA_Obj x, FLA_Obj y, FLA_Obj A)
Definition: FLA_Ger_external.c:13
dim_t FLA_Obj_length(FLA_Obj obj)
Definition: FLA_Query.c:116