libflame  revision_anchor
Functions
FLA_Lyap_n_opt_var3.c File Reference

(r)

Functions

FLA_Error FLA_Lyap_n_opt_var3 (FLA_Obj isgn, FLA_Obj A, FLA_Obj C)
 
FLA_Error FLA_Lyap_n_ops_var3 (int m_AC, float *buff_sgn, float *buff_A, int rs_A, int cs_A, float *buff_W, int rs_W, int cs_W, float *buff_C, int rs_C, int cs_C)
 
FLA_Error FLA_Lyap_n_opd_var3 (int m_AC, double *buff_sgn, double *buff_A, int rs_A, int cs_A, double *buff_W, int rs_W, int cs_W, double *buff_C, int rs_C, int cs_C)
 
FLA_Error FLA_Lyap_n_opc_var3 (int m_AC, scomplex *buff_sgn, scomplex *buff_A, int rs_A, int cs_A, scomplex *buff_W, int rs_W, int cs_W, scomplex *buff_C, int rs_C, int cs_C)
 
FLA_Error FLA_Lyap_n_opz_var3 (int m_AC, dcomplex *buff_sgn, dcomplex *buff_A, int rs_A, int cs_A, dcomplex *buff_W, int rs_W, int cs_W, dcomplex *buff_C, int rs_C, int cs_C)
 

Function Documentation

◆ FLA_Lyap_n_opc_var3()

FLA_Error FLA_Lyap_n_opc_var3 ( int  m_AC,
scomplex *  buff_sgn,
scomplex *  buff_A,
int  rs_A,
int  cs_A,
scomplex *  buff_W,
int  rs_W,
int  cs_W,
scomplex *  buff_C,
int  rs_C,
int  cs_C 
)

References bl1_caxpysv(), bl1_ccopymrt(), bl1_cdot2s(), bl1_cgemv(), bl1_cscalm(), bl1_cshiftdiag(), bl1_ctrsv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_MINUS_ONE, FLA_ONE, and i.

Referenced by FLA_Lyap_n_opt_var3().

348 {
349  scomplex* buff_1 = FLA_COMPLEX_PTR( FLA_ONE );
350  scomplex* buff_m1 = FLA_COMPLEX_PTR( FLA_MINUS_ONE );
351  int i;
352 
353  bl1_cscalm( BLIS1_NO_CONJUGATE,
354  m_AC,
355  m_AC,
356  buff_sgn,
357  buff_C, rs_C, cs_C );
358 
359  for ( i = m_AC - 1; i >= 0; --i )
360  {
361  scomplex* A00 = buff_A + (0 )*cs_A + (0 )*rs_A;
362  scomplex* a01 = buff_A + (i )*cs_A + (0 )*rs_A;
363  scomplex* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
364  scomplex* A02 = buff_A + (i+1)*cs_A + (0 )*rs_A;
365  scomplex* a12t = buff_A + (i+1)*cs_A + (i )*rs_A;
366 
367  scomplex* c01 = buff_C + (i )*cs_C + (0 )*rs_C;
368  scomplex* gamma11 = buff_C + (i )*cs_C + (i )*rs_C;
369  scomplex* C02 = buff_C + (i+1)*cs_C + (0 )*rs_C;
370  scomplex* c12t = buff_C + (i+1)*cs_C + (i )*rs_C;
371 
372  scomplex* W00 = buff_W + (0 )*cs_W + (0 )*rs_W;
373 
374  scomplex omega;
375 
376  int m_behind = i;
377  int m_ahead = m_AC - i - 1;
378 
379  /*------------------------------------------------------------*/
380 
381  // FLA_Dot2cs( FLA_CONJUGATE, FLA_MINUS_ONE, a12t, c12t, FLA_ONE, gamma11 );
382  bl1_cdot2s( BLIS1_CONJUGATE,
383  m_ahead,
384  buff_m1,
385  a12t, cs_A,
386  c12t, cs_C,
387  buff_1,
388  gamma11 );
389 
390  // FLA_Copyt( FLA_CONJ_NO_TRANSPOSE, alpha11, omega );
391  // FLA_Mult_add( FLA_ONE, alpha11, omega );
392  // FLA_Inv_scal( omega, gamma11 );
393  bl1_ccopyconj( alpha11, &omega );
394  bl1_cadd3( alpha11, &omega, &omega );
395  bl1_cinvscals( &omega, gamma11 );
396 
397  // FLA_Axpys( FLA_MINUS_ONE, gamma11, a01, FLA_ONE, c01 );
398  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, C02, a12t, FLA_ONE, c01 );
399  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, A02, c12t, FLA_ONE, c01 );
400  bl1_caxpysv( m_behind,
401  buff_m1,
402  gamma11,
403  a01, rs_A,
404  buff_1,
405  c01, rs_C );
406 
407  bl1_cgemv( BLIS1_NO_TRANSPOSE,
408  BLIS1_CONJUGATE,
409  m_behind,
410  m_ahead,
411  buff_m1,
412  C02, rs_C, cs_C,
413  a12t, cs_A,
414  buff_1,
415  c01, rs_C );
416 
417  bl1_cgemv( BLIS1_NO_TRANSPOSE,
418  BLIS1_CONJUGATE,
419  m_behind,
420  m_ahead,
421  buff_m1,
422  A02, rs_A, cs_A,
423  c12t, cs_C,
424  buff_1,
425  c01, rs_C );
426 
427  // FLA_Copyrt( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, A00, W00 );
428  // FLA_Shift_diag( FLA_CONJUGATE, alpha11, W00 );
429  // FLA_Trsv( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, FLA_NONUNIT_DIAG, W00, c01 );
430  bl1_ccopymrt( BLIS1_UPPER_TRIANGULAR,
431  BLIS1_NO_TRANSPOSE,
432  m_behind,
433  m_behind,
434  A00, rs_A, cs_A,
435  W00, rs_W, cs_W );
436 
437  bl1_cshiftdiag( BLIS1_CONJUGATE,
438  0,
439  m_behind,
440  m_behind,
441  alpha11,
442  W00, rs_W, cs_W );
443 
444  bl1_ctrsv( BLIS1_UPPER_TRIANGULAR,
445  BLIS1_NO_TRANSPOSE,
446  BLIS1_NONUNIT_DIAG,
447  m_behind,
448  W00, rs_W, cs_W,
449  c01, rs_C );
450 
451  /*------------------------------------------------------------*/
452  }
453 
454  return FLA_SUCCESS;
455 }
void bl1_ctrsv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, scomplex *a, int a_rs, int a_cs, scomplex *x, int incx)
Definition: bl1_trsv.c:99
FLA_Obj FLA_MINUS_ONE
Definition: FLA_Init.c:22
Definition: blis_type_defs.h:81
Definition: blis_type_defs.h:82
FLA_Obj FLA_ONE
Definition: FLA_Init.c:18
Definition: blis_type_defs.h:54
Definition: blis_type_defs.h:132
void bl1_cscalm(conj1_t conj, int m, int n, scomplex *alpha, scomplex *a, int a_rs, int a_cs)
Definition: bl1_scalm.c:169
void bl1_caxpysv(int n, scomplex *alpha0, scomplex *alpha1, scomplex *x, int incx, scomplex *beta, scomplex *y, int incy)
Definition: bl1_axpysv.c:51
void bl1_cgemv(trans1_t transa, conj1_t conjx, int m, int n, scomplex *alpha, scomplex *a, int a_rs, int a_cs, scomplex *x, int incx, scomplex *beta, scomplex *y, int incy)
Definition: bl1_gemv.c:125
int i
Definition: bl1_axmyv2.c:145
Definition: blis_type_defs.h:74
void bl1_cshiftdiag(conj1_t conj, int offset, int m, int n, scomplex *sigma, scomplex *a, int a_rs, int a_cs)
Definition: bl1_shiftdiag.c:97
void bl1_ccopymrt(uplo1_t uplo, trans1_t trans, int m, int n, scomplex *a, int a_rs, int a_cs, scomplex *b, int b_rs, int b_cs)
Definition: bl1_copymrt.c:223
Definition: blis_type_defs.h:63
void bl1_cdot2s(conj1_t conj, int n, scomplex *alpha, scomplex *x, int incx, scomplex *y, int incy, scomplex *beta, scomplex *rho)
Definition: bl1_dot2s.c:39

◆ FLA_Lyap_n_opd_var3()

FLA_Error FLA_Lyap_n_opd_var3 ( int  m_AC,
double *  buff_sgn,
double *  buff_A,
int  rs_A,
int  cs_A,
double *  buff_W,
int  rs_W,
int  cs_W,
double *  buff_C,
int  rs_C,
int  cs_C 
)

References bl1_daxpysv(), bl1_dcopymrt(), bl1_ddot2s(), bl1_dgemv(), bl1_dscalm(), bl1_dshiftdiag(), bl1_dtrsv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_MINUS_ONE, FLA_ONE, and i.

Referenced by FLA_Lyap_n_opt_var3().

232 {
233  double* buff_1 = FLA_DOUBLE_PTR( FLA_ONE );
234  double* buff_m1 = FLA_DOUBLE_PTR( FLA_MINUS_ONE );
235  int i;
236 
237  bl1_dscalm( BLIS1_NO_CONJUGATE,
238  m_AC,
239  m_AC,
240  buff_sgn,
241  buff_C, rs_C, cs_C );
242 
243  for ( i = m_AC - 1; i >= 0; --i )
244  {
245  double* A00 = buff_A + (0 )*cs_A + (0 )*rs_A;
246  double* a01 = buff_A + (i )*cs_A + (0 )*rs_A;
247  double* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
248  double* A02 = buff_A + (i+1)*cs_A + (0 )*rs_A;
249  double* a12t = buff_A + (i+1)*cs_A + (i )*rs_A;
250 
251  double* c01 = buff_C + (i )*cs_C + (0 )*rs_C;
252  double* gamma11 = buff_C + (i )*cs_C + (i )*rs_C;
253  double* C02 = buff_C + (i+1)*cs_C + (0 )*rs_C;
254  double* c12t = buff_C + (i+1)*cs_C + (i )*rs_C;
255 
256  double* W00 = buff_W + (0 )*cs_W + (0 )*rs_W;
257 
258  double omega;
259 
260  int m_behind = i;
261  int m_ahead = m_AC - i - 1;
262 
263  /*------------------------------------------------------------*/
264 
265  // FLA_Dot2cs( FLA_CONJUGATE, FLA_MINUS_ONE, a12t, c12t, FLA_ONE, gamma11 );
266  bl1_ddot2s( BLIS1_CONJUGATE,
267  m_ahead,
268  buff_m1,
269  a12t, cs_A,
270  c12t, cs_C,
271  buff_1,
272  gamma11 );
273 
274  // FLA_Copyt( FLA_CONJ_NO_TRANSPOSE, alpha11, omega );
275  // FLA_Mult_add( FLA_ONE, alpha11, omega );
276  // FLA_Inv_scal( omega, gamma11 );
277  bl1_dcopyconj( alpha11, &omega );
278  bl1_dadd3( alpha11, &omega, &omega );
279  bl1_dinvscals( &omega, gamma11 );
280 
281  // FLA_Axpys( FLA_MINUS_ONE, gamma11, a01, FLA_ONE, c01 );
282  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, C02, a12t, FLA_ONE, c01 );
283  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, A02, c12t, FLA_ONE, c01 );
284  bl1_daxpysv( m_behind,
285  buff_m1,
286  gamma11,
287  a01, rs_A,
288  buff_1,
289  c01, rs_C );
290 
291  bl1_dgemv( BLIS1_NO_TRANSPOSE,
292  BLIS1_CONJUGATE,
293  m_behind,
294  m_ahead,
295  buff_m1,
296  C02, rs_C, cs_C,
297  a12t, cs_A,
298  buff_1,
299  c01, rs_C );
300 
301  bl1_dgemv( BLIS1_NO_TRANSPOSE,
302  BLIS1_CONJUGATE,
303  m_behind,
304  m_ahead,
305  buff_m1,
306  A02, rs_A, cs_A,
307  c12t, cs_C,
308  buff_1,
309  c01, rs_C );
310 
311  // FLA_Copyrt( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, A00, W00 );
312  // FLA_Shift_diag( FLA_CONJUGATE, alpha11, W00 );
313  // FLA_Trsv( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, FLA_NONUNIT_DIAG, W00, c01 );
314  bl1_dcopymrt( BLIS1_UPPER_TRIANGULAR,
315  BLIS1_NO_TRANSPOSE,
316  m_behind,
317  m_behind,
318  A00, rs_A, cs_A,
319  W00, rs_W, cs_W );
320 
321  bl1_dshiftdiag( BLIS1_CONJUGATE,
322  0,
323  m_behind,
324  m_behind,
325  alpha11,
326  W00, rs_W, cs_W );
327 
328  bl1_dtrsv( BLIS1_UPPER_TRIANGULAR,
329  BLIS1_NO_TRANSPOSE,
330  BLIS1_NONUNIT_DIAG,
331  m_behind,
332  W00, rs_W, cs_W,
333  c01, rs_C );
334 
335  /*------------------------------------------------------------*/
336  }
337 
338  return FLA_SUCCESS;
339 }
void bl1_dgemv(trans1_t transa, conj1_t conjx, int m, int n, double *alpha, double *a, int a_rs, int a_cs, double *x, int incx, double *beta, double *y, int incy)
Definition: bl1_gemv.c:69
FLA_Obj FLA_MINUS_ONE
Definition: FLA_Init.c:22
Definition: blis_type_defs.h:81
void bl1_daxpysv(int n, double *alpha0, double *alpha1, double *x, int incx, double *beta, double *y, int incy)
Definition: bl1_axpysv.c:32
void bl1_ddot2s(conj1_t conj, int n, double *alpha, double *x, int incx, double *y, int incy, double *beta, double *rho)
Definition: bl1_dot2s.c:26
Definition: blis_type_defs.h:82
FLA_Obj FLA_ONE
Definition: FLA_Init.c:18
void bl1_dcopymrt(uplo1_t uplo, trans1_t trans, int m, int n, double *a, int a_rs, int a_cs, double *b, int b_rs, int b_cs)
Definition: bl1_copymrt.c:118
Definition: blis_type_defs.h:54
void bl1_dtrsv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, double *a, int a_rs, int a_cs, double *x, int incx)
Definition: bl1_trsv.c:56
void bl1_dshiftdiag(conj1_t conj, int offset, int m, int n, double *sigma, double *a, int a_rs, int a_cs)
Definition: bl1_shiftdiag.c:34
int i
Definition: bl1_axmyv2.c:145
Definition: blis_type_defs.h:74
void bl1_dscalm(conj1_t conj, int m, int n, double *alpha, double *a, int a_rs, int a_cs)
Definition: bl1_scalm.c:65
Definition: blis_type_defs.h:63

◆ FLA_Lyap_n_ops_var3()

FLA_Error FLA_Lyap_n_ops_var3 ( int  m_AC,
float *  buff_sgn,
float *  buff_A,
int  rs_A,
int  cs_A,
float *  buff_W,
int  rs_W,
int  cs_W,
float *  buff_C,
int  rs_C,
int  cs_C 
)

References bl1_saxpysv(), bl1_scopymrt(), bl1_sdot2s(), bl1_sgemv(), bl1_sscalm(), bl1_sshiftdiag(), bl1_strsv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_MINUS_ONE, FLA_ONE, and i.

Referenced by FLA_Lyap_n_opt_var3().

116 {
117  float* buff_1 = FLA_FLOAT_PTR( FLA_ONE );
118  float* buff_m1 = FLA_FLOAT_PTR( FLA_MINUS_ONE );
119  int i;
120 
121  bl1_sscalm( BLIS1_NO_CONJUGATE,
122  m_AC,
123  m_AC,
124  buff_sgn,
125  buff_C, rs_C, cs_C );
126 
127  for ( i = m_AC - 1; i >= 0; --i )
128  {
129  float* A00 = buff_A + (0 )*cs_A + (0 )*rs_A;
130  float* a01 = buff_A + (i )*cs_A + (0 )*rs_A;
131  float* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
132  float* A02 = buff_A + (i+1)*cs_A + (0 )*rs_A;
133  float* a12t = buff_A + (i+1)*cs_A + (i )*rs_A;
134 
135  float* c01 = buff_C + (i )*cs_C + (0 )*rs_C;
136  float* gamma11 = buff_C + (i )*cs_C + (i )*rs_C;
137  float* C02 = buff_C + (i+1)*cs_C + (0 )*rs_C;
138  float* c12t = buff_C + (i+1)*cs_C + (i )*rs_C;
139 
140  float* W00 = buff_W + (0 )*cs_W + (0 )*rs_W;
141 
142  float omega;
143 
144  int m_behind = i;
145  int m_ahead = m_AC - i - 1;
146 
147  /*------------------------------------------------------------*/
148 
149  // FLA_Dot2cs( FLA_CONJUGATE, FLA_MINUS_ONE, a12t, c12t, FLA_ONE, gamma11 );
150  bl1_sdot2s( BLIS1_CONJUGATE,
151  m_ahead,
152  buff_m1,
153  a12t, cs_A,
154  c12t, cs_C,
155  buff_1,
156  gamma11 );
157 
158  // FLA_Copyt( FLA_CONJ_NO_TRANSPOSE, alpha11, omega );
159  // FLA_Mult_add( FLA_ONE, alpha11, omega );
160  // FLA_Inv_scal( omega, gamma11 );
161  bl1_scopyconj( alpha11, &omega );
162  bl1_sadd3( alpha11, &omega, &omega );
163  bl1_sinvscals( &omega, gamma11 );
164 
165  // FLA_Axpys( FLA_MINUS_ONE, gamma11, a01, FLA_ONE, c01 );
166  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, C02, a12t, FLA_ONE, c01 );
167  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, A02, c12t, FLA_ONE, c01 );
168  bl1_saxpysv( m_behind,
169  buff_m1,
170  gamma11,
171  a01, rs_A,
172  buff_1,
173  c01, rs_C );
174 
175  bl1_sgemv( BLIS1_NO_TRANSPOSE,
176  BLIS1_CONJUGATE,
177  m_behind,
178  m_ahead,
179  buff_m1,
180  C02, rs_C, cs_C,
181  a12t, cs_A,
182  buff_1,
183  c01, rs_C );
184 
185  bl1_sgemv( BLIS1_NO_TRANSPOSE,
186  BLIS1_CONJUGATE,
187  m_behind,
188  m_ahead,
189  buff_m1,
190  A02, rs_A, cs_A,
191  c12t, cs_C,
192  buff_1,
193  c01, rs_C );
194 
195  // FLA_Copyrt( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, A00, W00 );
196  // FLA_Shift_diag( FLA_CONJUGATE, alpha11, W00 );
197  // FLA_Trsv( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, FLA_NONUNIT_DIAG, W00, c01 );
198  bl1_scopymrt( BLIS1_UPPER_TRIANGULAR,
199  BLIS1_NO_TRANSPOSE,
200  m_behind,
201  m_behind,
202  A00, rs_A, cs_A,
203  W00, rs_W, cs_W );
204 
205  bl1_sshiftdiag( BLIS1_CONJUGATE,
206  0,
207  m_behind,
208  m_behind,
209  alpha11,
210  W00, rs_W, cs_W );
211 
212  bl1_strsv( BLIS1_UPPER_TRIANGULAR,
213  BLIS1_NO_TRANSPOSE,
214  BLIS1_NONUNIT_DIAG,
215  m_behind,
216  W00, rs_W, cs_W,
217  c01, rs_C );
218 
219  /*------------------------------------------------------------*/
220  }
221 
222  return FLA_SUCCESS;
223 }
FLA_Obj FLA_MINUS_ONE
Definition: FLA_Init.c:22
Definition: blis_type_defs.h:81
void bl1_saxpysv(int n, float *alpha0, float *alpha1, float *x, int incx, float *beta, float *y, int incy)
Definition: bl1_axpysv.c:13
void bl1_sshiftdiag(conj1_t conj, int offset, int m, int n, float *sigma, float *a, int a_rs, int a_cs)
Definition: bl1_shiftdiag.c:13
void bl1_strsv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, float *a, int a_rs, int a_cs, float *x, int incx)
Definition: bl1_trsv.c:13
Definition: blis_type_defs.h:82
FLA_Obj FLA_ONE
Definition: FLA_Init.c:18
void bl1_sgemv(trans1_t transa, conj1_t conjx, int m, int n, float *alpha, float *a, int a_rs, int a_cs, float *x, int incx, float *beta, float *y, int incy)
Definition: bl1_gemv.c:13
void bl1_sscalm(conj1_t conj, int m, int n, float *alpha, float *a, int a_rs, int a_cs)
Definition: bl1_scalm.c:13
Definition: blis_type_defs.h:54
void bl1_scopymrt(uplo1_t uplo, trans1_t trans, int m, int n, float *a, int a_rs, int a_cs, float *b, int b_rs, int b_cs)
Definition: bl1_copymrt.c:13
void bl1_sdot2s(conj1_t conj, int n, float *alpha, float *x, int incx, float *y, int incy, float *beta, float *rho)
Definition: bl1_dot2s.c:13
int i
Definition: bl1_axmyv2.c:145
Definition: blis_type_defs.h:74
Definition: blis_type_defs.h:63

◆ FLA_Lyap_n_opt_var3()

FLA_Error FLA_Lyap_n_opt_var3 ( FLA_Obj  isgn,
FLA_Obj  A,
FLA_Obj  C 
)

References FLA_Lyap_n_opc_var3(), FLA_Lyap_n_opd_var3(), FLA_Lyap_n_ops_var3(), FLA_Lyap_n_opz_var3(), FLA_Obj_col_stride(), FLA_Obj_create_conf_to(), FLA_Obj_datatype(), FLA_Obj_free(), FLA_Obj_length(), and FLA_Obj_row_stride().

Referenced by FLA_Lyap_n().

14 {
15  FLA_Datatype datatype;
16  int m_AC;
17  int rs_A, cs_A;
18  int rs_W, cs_W;
19  int rs_C, cs_C;
20  FLA_Obj W;
21 
22  FLA_Obj_create_conf_to( FLA_NO_TRANSPOSE, A, &W );
23 
24  datatype = FLA_Obj_datatype( A );
25 
26  m_AC = FLA_Obj_length( A );
27 
28  rs_A = FLA_Obj_row_stride( A );
29  cs_A = FLA_Obj_col_stride( A );
30 
31  rs_W = FLA_Obj_row_stride( W );
32  cs_W = FLA_Obj_col_stride( W );
33 
34  rs_C = FLA_Obj_row_stride( C );
35  cs_C = FLA_Obj_col_stride( C );
36 
37  switch ( datatype )
38  {
39  case FLA_FLOAT:
40  {
41  float* buff_A = FLA_FLOAT_PTR( A );
42  float* buff_W = FLA_FLOAT_PTR( W );
43  float* buff_C = FLA_FLOAT_PTR( C );
44  float* buff_sgn = FLA_FLOAT_PTR( isgn );
45 
46  FLA_Lyap_n_ops_var3( m_AC,
47  buff_sgn,
48  buff_A, rs_A, cs_A,
49  buff_W, rs_W, cs_W,
50  buff_C, rs_C, cs_C );
51 
52  break;
53  }
54 
55  case FLA_DOUBLE:
56  {
57  double* buff_A = FLA_DOUBLE_PTR( A );
58  double* buff_W = FLA_DOUBLE_PTR( W );
59  double* buff_C = FLA_DOUBLE_PTR( C );
60  double* buff_sgn = FLA_DOUBLE_PTR( isgn );
61 
62  FLA_Lyap_n_opd_var3( m_AC,
63  buff_sgn,
64  buff_A, rs_A, cs_A,
65  buff_W, rs_W, cs_W,
66  buff_C, rs_C, cs_C );
67 
68  break;
69  }
70 
71  case FLA_COMPLEX:
72  {
73  scomplex* buff_A = FLA_COMPLEX_PTR( A );
74  scomplex* buff_W = FLA_COMPLEX_PTR( W );
75  scomplex* buff_C = FLA_COMPLEX_PTR( C );
76  scomplex* buff_sgn = FLA_COMPLEX_PTR( isgn );
77 
78  FLA_Lyap_n_opc_var3( m_AC,
79  buff_sgn,
80  buff_A, rs_A, cs_A,
81  buff_W, rs_W, cs_W,
82  buff_C, rs_C, cs_C );
83 
84  break;
85  }
86 
87  case FLA_DOUBLE_COMPLEX:
88  {
89  dcomplex* buff_A = FLA_DOUBLE_COMPLEX_PTR( A );
90  dcomplex* buff_W = FLA_DOUBLE_COMPLEX_PTR( W );
91  dcomplex* buff_C = FLA_DOUBLE_COMPLEX_PTR( C );
92  dcomplex* buff_sgn = FLA_DOUBLE_COMPLEX_PTR( isgn );
93 
94  FLA_Lyap_n_opz_var3( m_AC,
95  buff_sgn,
96  buff_A, rs_A, cs_A,
97  buff_W, rs_W, cs_W,
98  buff_C, rs_C, cs_C );
99 
100  break;
101  }
102  }
103 
104  FLA_Obj_free( &W );
105 
106  return FLA_SUCCESS;
107 }
FLA_Error FLA_Obj_free(FLA_Obj *obj)
Definition: FLA_Obj.c:588
dim_t FLA_Obj_row_stride(FLA_Obj obj)
Definition: FLA_Query.c:167
FLA_Datatype FLA_Obj_datatype(FLA_Obj obj)
Definition: FLA_Query.c:13
Definition: FLA_type_defs.h:158
FLA_Error FLA_Obj_create_conf_to(FLA_Trans trans, FLA_Obj old, FLA_Obj *obj)
Definition: FLA_Obj.c:286
Definition: blis_type_defs.h:132
FLA_Error FLA_Lyap_n_opd_var3(int m_AC, double *buff_sgn, double *buff_A, int rs_A, int cs_A, double *buff_W, int rs_W, int cs_W, double *buff_C, int rs_C, int cs_C)
Definition: FLA_Lyap_n_opt_var3.c:227
int FLA_Datatype
Definition: FLA_type_defs.h:49
FLA_Error FLA_Lyap_n_opc_var3(int m_AC, scomplex *buff_sgn, scomplex *buff_A, int rs_A, int cs_A, scomplex *buff_W, int rs_W, int cs_W, scomplex *buff_C, int rs_C, int cs_C)
Definition: FLA_Lyap_n_opt_var3.c:343
dim_t FLA_Obj_col_stride(FLA_Obj obj)
Definition: FLA_Query.c:174
FLA_Error FLA_Lyap_n_ops_var3(int m_AC, float *buff_sgn, float *buff_A, int rs_A, int cs_A, float *buff_W, int rs_W, int cs_W, float *buff_C, int rs_C, int cs_C)
Definition: FLA_Lyap_n_opt_var3.c:111
dim_t FLA_Obj_length(FLA_Obj obj)
Definition: FLA_Query.c:116
Definition: blis_type_defs.h:137
FLA_Error FLA_Lyap_n_opz_var3(int m_AC, dcomplex *buff_sgn, dcomplex *buff_A, int rs_A, int cs_A, dcomplex *buff_W, int rs_W, int cs_W, dcomplex *buff_C, int rs_C, int cs_C)
Definition: FLA_Lyap_n_opt_var3.c:459

◆ FLA_Lyap_n_opz_var3()

FLA_Error FLA_Lyap_n_opz_var3 ( int  m_AC,
dcomplex *  buff_sgn,
dcomplex *  buff_A,
int  rs_A,
int  cs_A,
dcomplex *  buff_W,
int  rs_W,
int  cs_W,
dcomplex *  buff_C,
int  rs_C,
int  cs_C 
)

References bl1_zaxpysv(), bl1_zcopymrt(), bl1_zdot2s(), bl1_zgemv(), bl1_zscalm(), bl1_zshiftdiag(), bl1_ztrsv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_MINUS_ONE, FLA_ONE, and i.

Referenced by FLA_Lyap_n_opt_var3().

464 {
465  dcomplex* buff_1 = FLA_DOUBLE_COMPLEX_PTR( FLA_ONE );
466  dcomplex* buff_m1 = FLA_DOUBLE_COMPLEX_PTR( FLA_MINUS_ONE );
467  int i;
468 
469  bl1_zscalm( BLIS1_NO_CONJUGATE,
470  m_AC,
471  m_AC,
472  buff_sgn,
473  buff_C, rs_C, cs_C );
474 
475  for ( i = m_AC - 1; i >= 0; --i )
476  {
477  dcomplex* A00 = buff_A + (0 )*cs_A + (0 )*rs_A;
478  dcomplex* a01 = buff_A + (i )*cs_A + (0 )*rs_A;
479  dcomplex* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
480  dcomplex* A02 = buff_A + (i+1)*cs_A + (0 )*rs_A;
481  dcomplex* a12t = buff_A + (i+1)*cs_A + (i )*rs_A;
482 
483  dcomplex* c01 = buff_C + (i )*cs_C + (0 )*rs_C;
484  dcomplex* gamma11 = buff_C + (i )*cs_C + (i )*rs_C;
485  dcomplex* C02 = buff_C + (i+1)*cs_C + (0 )*rs_C;
486  dcomplex* c12t = buff_C + (i+1)*cs_C + (i )*rs_C;
487 
488  dcomplex* W00 = buff_W + (0 )*cs_W + (0 )*rs_W;
489 
490  dcomplex omega;
491 
492  int m_behind = i;
493  int m_ahead = m_AC - i - 1;
494 
495  /*------------------------------------------------------------*/
496 
497  // FLA_Dot2cs( FLA_CONJUGATE, FLA_MINUS_ONE, a12t, c12t, FLA_ONE, gamma11 );
498  bl1_zdot2s( BLIS1_CONJUGATE,
499  m_ahead,
500  buff_m1,
501  a12t, cs_A,
502  c12t, cs_C,
503  buff_1,
504  gamma11 );
505 
506  // FLA_Copyt( FLA_CONJ_NO_TRANSPOSE, alpha11, omega );
507  // FLA_Mult_add( FLA_ONE, alpha11, omega );
508  // FLA_Inv_scal( omega, gamma11 );
509  bl1_zcopyconj( alpha11, &omega );
510  bl1_zadd3( alpha11, &omega, &omega );
511  bl1_zinvscals( &omega, gamma11 );
512 
513  // FLA_Axpys( FLA_MINUS_ONE, gamma11, a01, FLA_ONE, c01 );
514  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, C02, a12t, FLA_ONE, c01 );
515  // FLA_Gemvc( FLA_NO_TRANSPOSE, FLA_CONJUGATE, FLA_MINUS_ONE, A02, c12t, FLA_ONE, c01 );
516  bl1_zaxpysv( m_behind,
517  buff_m1,
518  gamma11,
519  a01, rs_A,
520  buff_1,
521  c01, rs_C );
522 
523  bl1_zgemv( BLIS1_NO_TRANSPOSE,
524  BLIS1_CONJUGATE,
525  m_behind,
526  m_ahead,
527  buff_m1,
528  C02, rs_C, cs_C,
529  a12t, cs_A,
530  buff_1,
531  c01, rs_C );
532 
533  bl1_zgemv( BLIS1_NO_TRANSPOSE,
534  BLIS1_CONJUGATE,
535  m_behind,
536  m_ahead,
537  buff_m1,
538  A02, rs_A, cs_A,
539  c12t, cs_C,
540  buff_1,
541  c01, rs_C );
542 
543  // FLA_Copyrt( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, A00, W00 );
544  // FLA_Shift_diag( FLA_CONJUGATE, alpha11, W00 );
545  // FLA_Trsv( FLA_UPPER_TRIANGULAR, FLA_NO_TRANSPOSE, FLA_NONUNIT_DIAG, W00, c01 );
546  bl1_zcopymrt( BLIS1_UPPER_TRIANGULAR,
547  BLIS1_NO_TRANSPOSE,
548  m_behind,
549  m_behind,
550  A00, rs_A, cs_A,
551  W00, rs_W, cs_W );
552 
553  bl1_zshiftdiag( BLIS1_CONJUGATE,
554  0,
555  m_behind,
556  m_behind,
557  alpha11,
558  W00, rs_W, cs_W );
559 
560  bl1_ztrsv( BLIS1_UPPER_TRIANGULAR,
561  BLIS1_NO_TRANSPOSE,
562  BLIS1_NONUNIT_DIAG,
563  m_behind,
564  W00, rs_W, cs_W,
565  c01, rs_C );
566 
567  /*------------------------------------------------------------*/
568  }
569 
570  return FLA_SUCCESS;
571 }
FLA_Obj FLA_MINUS_ONE
Definition: FLA_Init.c:22
Definition: blis_type_defs.h:81
void bl1_zdot2s(conj1_t conj, int n, dcomplex *alpha, dcomplex *x, int incx, dcomplex *y, int incy, dcomplex *beta, dcomplex *rho)
Definition: bl1_dot2s.c:70
void bl1_zscalm(conj1_t conj, int m, int n, dcomplex *alpha, dcomplex *a, int a_rs, int a_cs)
Definition: bl1_scalm.c:273
Definition: blis_type_defs.h:82
void bl1_zshiftdiag(conj1_t conj, int offset, int m, int n, dcomplex *sigma, dcomplex *a, int a_rs, int a_cs)
Definition: bl1_shiftdiag.c:122
FLA_Obj FLA_ONE
Definition: FLA_Init.c:18
void bl1_zaxpysv(int n, dcomplex *alpha0, dcomplex *alpha1, dcomplex *x, int incx, dcomplex *beta, dcomplex *y, int incy)
Definition: bl1_axpysv.c:71
Definition: blis_type_defs.h:54
void bl1_zgemv(trans1_t transa, conj1_t conjx, int m, int n, dcomplex *alpha, dcomplex *a, int a_rs, int a_cs, dcomplex *x, int incx, dcomplex *beta, dcomplex *y, int incy)
Definition: bl1_gemv.c:255
int i
Definition: bl1_axmyv2.c:145
void bl1_zcopymrt(uplo1_t uplo, trans1_t trans, int m, int n, dcomplex *a, int a_rs, int a_cs, dcomplex *b, int b_rs, int b_cs)
Definition: bl1_copymrt.c:328
Definition: blis_type_defs.h:74
Definition: blis_type_defs.h:63
Definition: blis_type_defs.h:137
void bl1_ztrsv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, dcomplex *a, int a_rs, int a_cs, dcomplex *x, int incx)
Definition: bl1_trsv.c:177