libflame  revision_anchor
Functions
FLA_LU_piv_unb_var4.c File Reference

(r)

Functions

FLA_Error FLA_LU_piv_unb_var4 (FLA_Obj A, FLA_Obj p)
 

Function Documentation

◆ FLA_LU_piv_unb_var4()

FLA_Error FLA_LU_piv_unb_var4 ( FLA_Obj  A,
FLA_Obj  p 
)

References FLA_Amax_external(), FLA_Apply_pivots(), FLA_Cont_with_3x1_to_2x1(), FLA_Cont_with_3x3_to_2x2(), FLA_Dots_external(), FLA_Gemv_external(), FLA_Inv_scal_external(), FLA_Merge_2x1(), FLA_MINUS_ONE, FLA_Obj_length(), FLA_Obj_width(), FLA_ONE, FLA_Part_2x1(), FLA_Part_2x2(), FLA_Repart_2x1_to_3x1(), and FLA_Repart_2x2_to_3x3().

Referenced by FLA_LU_piv_internal().

16 { // Body of FLA_LU_piv_unb_var4( A, p ): sweeps A one row/column at a time, updating its partitions and storing one pivot index per step in p.
17  FLA_Obj ATL, ATR, A00, a01, A02,
18  ABL, ABR, a10t, alpha11, a12t,
19  A20, a21, A22;
20  // Views of the pivot vector p (top/bottom parts and the entry exposed in the current step).
21  FLA_Obj pT, p0,
22  pB, pi1,
23  p2;
24  // Merged views built with FLA_Merge_2x1: the current row piece stacked on top of the piece below it.
25  FLA_Obj AB0, aB1, AB2;
26  // Initial partitioning: request a 0 x 0 FLA_TL quadrant of A and a 0-length FLA_TOP part of p.
27 
28  FLA_Part_2x2( A, &ATL, &ATR,
29  &ABL, &ABR, 0, 0, FLA_TL );
30 
31  FLA_Part_2x1( p, &pT,
32  &pB, 0, FLA_TOP );
33  // Keep iterating while ATL is smaller than A in both length and width.
34  while ( FLA_Obj_length( ATL ) < FLA_Obj_length( A ) &&
35  FLA_Obj_width( ATL ) < FLA_Obj_width( A )){
36  // Repartition with mb = nb = 1 from the FLA_BR quadrant to expose alpha11 and its neighbouring pieces.
37  FLA_Repart_2x2_to_3x3( ATL, /**/ ATR, &A00, /**/ &a01, &A02,
38  /* ************* */ /* ************************** */
39  &a10t, /**/ &alpha11, &a12t,
40  ABL, /**/ ABR, &A20, /**/ &a21, &A22,
41  1, 1, FLA_BR );
42  // Expose the matching pivot entry pi1 (mb = 1) from the FLA_BOTTOM part of p.
43  FLA_Repart_2x1_to_3x1( pT, &p0,
44  /* ** */ /* *** */
45  &pi1,
46  pB, &p2, 1, FLA_BOTTOM );
47 
48  /*------------------------------------------------------------*/
49 
50  // alpha11 = alpha11 - a10t * a01
51  FLA_Dots_external( FLA_MINUS_ONE, a10t, a01, FLA_ONE, alpha11 );
52 
53  // a21 = a21 - A20 * a01
54  FLA_Gemv_external( FLA_NO_TRANSPOSE, FLA_MINUS_ONE, A20, a01, FLA_ONE, a21 );
55 
56  // aB1 = / alpha11 \
57  // \ a21 /
58  FLA_Merge_2x1( alpha11,
59  a21, &aB1 );
60 
61  // Determine pivot index
62  FLA_Amax_external( aB1, pi1 );
63 
64  // Apply pivots to current column
65  FLA_Apply_pivots( FLA_LEFT, FLA_NO_TRANSPOSE, pi1, aB1 );
66 
67  // AB0 = / a10t \
68  // \ A20 /
69  FLA_Merge_2x1( a10t,
70  A20, &AB0 );
71 
72  // AB2 = / a12t \
73  // \ A22 /
74  FLA_Merge_2x1( a12t,
75  A22, &AB2 );
76 
77  // Apply pivots to remaining columns
78  FLA_Apply_pivots( FLA_LEFT, FLA_NO_TRANSPOSE, pi1, AB0 );
79  FLA_Apply_pivots( FLA_LEFT, FLA_NO_TRANSPOSE, pi1, AB2 );
80 
81  // a21 = a21 / alpha11
82  FLA_Inv_scal_external( alpha11, a21 );
83  // NOTE(review): alpha11 is not tested against zero in this function before the scaling above - confirm how FLA_Inv_scal_external handles that case.
84  // a12t = a12t - a10t * A02
85  FLA_Gemv_external( FLA_TRANSPOSE, FLA_MINUS_ONE, A02, a10t, FLA_ONE, a12t );
86 
87  /*------------------------------------------------------------*/
88  // Advance the partitions: the pieces exposed in this step are handed back on the FLA_TL / FLA_TOP side.
89  FLA_Cont_with_3x3_to_2x2( &ATL, /**/ &ATR, A00, a01, /**/ A02,
90  a10t, alpha11, /**/ a12t,
91  /* ************** */ /* ************************ */
92  &ABL, /**/ &ABR, A20, a21, /**/ A22,
93  FLA_TL );
94 
95  FLA_Cont_with_3x1_to_2x1( &pT, p0,
96  pi1,
97  /* ** */ /* *** */
98  &pB, p2, FLA_TOP );
99 
100  }
101  // Always reports FLA_SUCCESS; the FLA_Error results of the calls above are not inspected here.
102  return FLA_SUCCESS;
103 }
FLA_Error FLA_Repart_2x1_to_3x1(FLA_Obj AT, FLA_Obj *A0, FLA_Obj *A1, FLA_Obj AB, FLA_Obj *A2, dim_t mb, FLA_Side side)
Definition: FLA_View.c:226
FLA_Error FLA_Dots_external(FLA_Obj alpha, FLA_Obj x, FLA_Obj y, FLA_Obj beta, FLA_Obj rho)
Definition: FLA_Dots_external.c:13
FLA_Error FLA_Inv_scal_external(FLA_Obj alpha, FLA_Obj A)
Definition: FLA_Inv_scal_external.c:13
FLA_Error FLA_Gemv_external(FLA_Trans transa, FLA_Obj alpha, FLA_Obj A, FLA_Obj x, FLA_Obj beta, FLA_Obj y)
Definition: FLA_Gemv_external.c:13
FLA_Obj FLA_MINUS_ONE
Definition: FLA_Init.c:22
FLA_Error FLA_Repart_2x2_to_3x3(FLA_Obj ATL, FLA_Obj ATR, FLA_Obj *A00, FLA_Obj *A01, FLA_Obj *A02, FLA_Obj *A10, FLA_Obj *A11, FLA_Obj *A12, FLA_Obj ABL, FLA_Obj ABR, FLA_Obj *A20, FLA_Obj *A21, FLA_Obj *A22, dim_t mb, dim_t nb, FLA_Quadrant quadrant)
Definition: FLA_View.c:142
FLA_Error FLA_Cont_with_3x1_to_2x1(FLA_Obj *AT, FLA_Obj A0, FLA_Obj A1, FLA_Obj *AB, FLA_Obj A2, FLA_Side side)
Definition: FLA_View.c:428
FLA_Error FLA_Part_2x2(FLA_Obj A, FLA_Obj *A11, FLA_Obj *A12, FLA_Obj *A21, FLA_Obj *A22, dim_t mb, dim_t nb, FLA_Quadrant quadrant)
Definition: FLA_View.c:17
FLA_Obj FLA_ONE
Definition: FLA_Init.c:18
Definition: FLA_type_defs.h:158
dim_t FLA_Obj_width(FLA_Obj obj)
Definition: FLA_Query.c:123
FLA_Error FLA_Part_2x1(FLA_Obj A, FLA_Obj *A1, FLA_Obj *A2, dim_t mb, FLA_Side side)
Definition: FLA_View.c:76
FLA_Error FLA_Cont_with_3x3_to_2x2(FLA_Obj *ATL, FLA_Obj *ATR, FLA_Obj A00, FLA_Obj A01, FLA_Obj A02, FLA_Obj A10, FLA_Obj A11, FLA_Obj A12, FLA_Obj *ABL, FLA_Obj *ABR, FLA_Obj A20, FLA_Obj A21, FLA_Obj A22, FLA_Quadrant quadrant)
Definition: FLA_View.c:304
FLA_Error FLA_Apply_pivots(FLA_Side side, FLA_Trans trans, FLA_Obj p, FLA_Obj A)
Definition: FLA_Apply_pivots.c:15
dim_t FLA_Obj_length(FLA_Obj obj)
Definition: FLA_Query.c:116
FLA_Error FLA_Amax_external(FLA_Obj x, FLA_Obj index)
Definition: FLA_Amax_external.c:13
FLA_Error FLA_Merge_2x1(FLA_Obj AT, FLA_Obj AB, FLA_Obj *A)
Definition: FLA_View.c:541