libflame  revision_anchor
Functions
FLA_Eig_gest_il_opt_var3.c File Reference

(r)

Functions

FLA_Error FLA_Eig_gest_il_opt_var3 (FLA_Obj A, FLA_Obj Y, FLA_Obj B)
 
FLA_Error FLA_Eig_gest_il_ops_var3 (int m_AB, float *buff_A, int rs_A, int cs_A, float *buff_Y, int rs_Y, int cs_Y, float *buff_B, int rs_B, int cs_B)
 
FLA_Error FLA_Eig_gest_il_opd_var3 (int m_AB, double *buff_A, int rs_A, int cs_A, double *buff_Y, int rs_Y, int cs_Y, double *buff_B, int rs_B, int cs_B)
 
FLA_Error FLA_Eig_gest_il_opc_var3 (int m_AB, scomplex *buff_A, int rs_A, int cs_A, scomplex *buff_Y, int rs_Y, int cs_Y, scomplex *buff_B, int rs_B, int cs_B)
 
FLA_Error FLA_Eig_gest_il_opz_var3 (int m_AB, dcomplex *buff_A, int rs_A, int cs_A, dcomplex *buff_Y, int rs_Y, int cs_Y, dcomplex *buff_B, int rs_B, int cs_B)
 

Function Documentation

◆ FLA_Eig_gest_il_opc_var3()

FLA_Error FLA_Eig_gest_il_opc_var3 ( int  m_AB,
scomplex *  buff_A,
int  rs_A,
int  cs_A,
scomplex *  buff_Y,
int  rs_Y,
int  cs_Y,
scomplex *  buff_B,
int  rs_B,
int  cs_B 
)
352 {
353  scomplex* buff_1 = FLA_COMPLEX_PTR( FLA_ONE );
354  scomplex* buff_m1 = FLA_COMPLEX_PTR( FLA_MINUS_ONE );
355  scomplex* buff_m1h = FLA_COMPLEX_PTR( FLA_MINUS_ONE_HALF );
356  int i;
357 
358  for ( i = 0; i < m_AB; ++i )
359  {
360  scomplex* a10t = buff_A + (0 )*cs_A + (i )*rs_A;
361  scomplex* A20 = buff_A + (0 )*cs_A + (i+1)*rs_A;
362  scomplex* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
363  scomplex* a21 = buff_A + (i )*cs_A + (i+1)*rs_A;
364 
365  scomplex* y10t = buff_Y + (0 )*cs_Y + (i )*rs_Y;
366  scomplex* Y20 = buff_Y + (0 )*cs_Y + (i+1)*rs_Y;
367  scomplex* y21 = buff_Y + (i )*cs_Y + (i+1)*rs_Y;
368 
369  scomplex* b10t = buff_B + (0 )*cs_B + (i )*rs_B;
370  scomplex* B20 = buff_B + (0 )*cs_B + (i+1)*rs_B;
371  scomplex* beta11 = buff_B + (i )*cs_B + (i )*rs_B;
372  scomplex* b21 = buff_B + (i )*cs_B + (i+1)*rs_B;
373 
374  int m_ahead = m_AB - i - 1;
375  int m_behind = i;
376 
377  /*------------------------------------------------------------*/
378 
379  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
380  bl1_caxpyv( BLIS1_NO_CONJUGATE,
381  m_behind,
382  buff_m1h,
383  y10t, cs_Y,
384  a10t, cs_A );
385 
386  // FLA_Dot2cs_external( FLA_CONJUGATE, FLA_MINUS_ONE, a10t, b10t, FLA_ONE, alpha11 );
387  bl1_cdot2s( BLIS1_CONJUGATE,
388  m_behind,
389  buff_m1,
390  a10t, cs_A,
391  b10t, cs_B,
392  buff_1,
393  alpha11 );
394 
395  // FLA_Inv_scal_external( beta11, alpha11 );
396  // FLA_Inv_scal_external( beta11, alpha11 );
397  bl1_cinvscals( beta11, alpha11 );
398  bl1_cinvscals( beta11, alpha11 );
399 
400  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
401  // FLA_MINUS_ONE, A20, b10t, FLA_ONE, a21 );
402  bl1_cgemv( BLIS1_NO_TRANSPOSE,
403  BLIS1_CONJUGATE,
404  m_ahead,
405  m_behind,
406  buff_m1,
407  A20, rs_A, cs_A,
408  b10t, cs_B,
409  buff_1,
410  a21, rs_A );
411 
412  // FLA_Inv_scal_external( beta11, a21 );
413  bl1_cinvscalv( BLIS1_NO_CONJUGATE,
414  m_ahead,
415  beta11,
416  a21, rs_A );
417 
418  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
419  bl1_caxpyv( BLIS1_NO_CONJUGATE,
420  m_behind,
421  buff_m1h,
422  y10t, cs_Y,
423  a10t, cs_A );
424 
425  // FLA_Inv_scal_external( beta11, a10t );
426  bl1_cinvscalv( BLIS1_NO_CONJUGATE,
427  m_behind,
428  beta11,
429  a10t, cs_A );
430 
431  // FLA_Ger_external( FLA_ONE, b21, a10t, Y20 );
432  bl1_cger( BLIS1_NO_CONJUGATE,
433  BLIS1_NO_CONJUGATE,
434  m_ahead,
435  m_behind,
436  buff_1,
437  b21, rs_B,
438  a10t, cs_A,
439  Y20, rs_Y, cs_Y );
440 
441  // FLA_Copy_external( b21, y21 );
442  // FLA_Scal_external( alpha11, y21 );
443  bl1_ccopyv( BLIS1_NO_CONJUGATE,
444  m_ahead,
445  b21, rs_B,
446  y21, rs_Y );
447  bl1_cscalv( BLIS1_NO_CONJUGATE,
448  m_ahead,
449  alpha11,
450  y21, rs_Y );
451 
452  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
453  // FLA_ONE, B20, a10t, FLA_ONE, y21 );
454  bl1_cgemv( BLIS1_NO_TRANSPOSE,
455  BLIS1_CONJUGATE,
456  m_ahead,
457  m_behind,
458  buff_1,
459  B20, rs_B, cs_B,
460  a10t, cs_A,
461  buff_1,
462  y21, rs_Y );
463 
464  /*------------------------------------------------------------*/
465 
466  }
467 
468  return FLA_SUCCESS;
469 }
FLA_Obj FLA_MINUS_ONE_HALF
Definition: FLA_Init.c:21
FLA_Obj FLA_MINUS_ONE
Definition: FLA_Init.c:22
FLA_Obj FLA_ONE
Definition: FLA_Init.c:18
int i
Definition: bl1_axmyv2.c:145
void bl1_caxpyv(conj1_t conj, int n, scomplex *alpha, scomplex *x, int incx, scomplex *y, int incy)
Definition: bl1_axpyv.c:29
void bl1_ccopyv(conj1_t conj, int m, scomplex *x, int incx, scomplex *y, int incy)
Definition: bl1_copyv.c:49
void bl1_cdot2s(conj1_t conj, int n, scomplex *alpha, scomplex *x, int incx, scomplex *y, int incy, scomplex *beta, scomplex *rho)
Definition: bl1_dot2s.c:39
void bl1_cgemv(trans1_t transa, conj1_t conjx, int m, int n, scomplex *alpha, scomplex *a, int a_rs, int a_cs, scomplex *x, int incx, scomplex *beta, scomplex *y, int incy)
Definition: bl1_gemv.c:125
void bl1_cger(conj1_t conjx, conj1_t conjy, int m, int n, scomplex *alpha, scomplex *x, int incx, scomplex *y, int incy, scomplex *a, int a_rs, int a_cs)
Definition: bl1_ger.c:111
void bl1_cinvscalv(conj1_t conj, int n, scomplex *alpha, scomplex *x, int incx)
Definition: bl1_invscalv.c:52
void bl1_cscalv(conj1_t conj, int n, scomplex *alpha, scomplex *x, int incx)
Definition: bl1_scalv.c:46
@ BLIS1_NO_TRANSPOSE
Definition: blis_type_defs.h:54
@ BLIS1_CONJUGATE
Definition: blis_type_defs.h:82
@ BLIS1_NO_CONJUGATE
Definition: blis_type_defs.h:81
Definition: blis_type_defs.h:133

References bl1_caxpyv(), bl1_ccopyv(), bl1_cdot2s(), bl1_cgemv(), bl1_cger(), bl1_cinvscalv(), bl1_cscalv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, FLA_MINUS_ONE, FLA_MINUS_ONE_HALF, FLA_ONE, and i.

Referenced by FLA_Eig_gest_il_opt_var3().

◆ FLA_Eig_gest_il_opd_var3()

FLA_Error FLA_Eig_gest_il_opd_var3 ( int  m_AB,
double *  buff_A,
int  rs_A,
int  cs_A,
double *  buff_Y,
int  rs_Y,
int  cs_Y,
double *  buff_B,
int  rs_B,
int  cs_B 
)
227 {
228  double* buff_1 = FLA_DOUBLE_PTR( FLA_ONE );
229  double* buff_m1 = FLA_DOUBLE_PTR( FLA_MINUS_ONE );
230  double* buff_m1h = FLA_DOUBLE_PTR( FLA_MINUS_ONE_HALF );
231  int i;
232 
233  for ( i = 0; i < m_AB; ++i )
234  {
235  double* a10t = buff_A + (0 )*cs_A + (i )*rs_A;
236  double* A20 = buff_A + (0 )*cs_A + (i+1)*rs_A;
237  double* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
238  double* a21 = buff_A + (i )*cs_A + (i+1)*rs_A;
239 
240  double* y10t = buff_Y + (0 )*cs_Y + (i )*rs_Y;
241  double* Y20 = buff_Y + (0 )*cs_Y + (i+1)*rs_Y;
242  double* y21 = buff_Y + (i )*cs_Y + (i+1)*rs_Y;
243 
244  double* b10t = buff_B + (0 )*cs_B + (i )*rs_B;
245  double* B20 = buff_B + (0 )*cs_B + (i+1)*rs_B;
246  double* beta11 = buff_B + (i )*cs_B + (i )*rs_B;
247  double* b21 = buff_B + (i )*cs_B + (i+1)*rs_B;
248 
249  int m_ahead = m_AB - i - 1;
250  int m_behind = i;
251 
252  /*------------------------------------------------------------*/
253 
254  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
255  bl1_daxpyv( BLIS1_NO_CONJUGATE,
256  m_behind,
257  buff_m1h,
258  y10t, cs_Y,
259  a10t, cs_A );
260 
261  // FLA_Dot2cs_external( FLA_CONJUGATE, FLA_MINUS_ONE, a10t, b10t, FLA_ONE, alpha11 );
262  bl1_ddot2s( BLIS1_CONJUGATE,
263  m_behind,
264  buff_m1,
265  a10t, cs_A,
266  b10t, cs_B,
267  buff_1,
268  alpha11 );
269 
270  // FLA_Inv_scal_external( beta11, alpha11 );
271  // FLA_Inv_scal_external( beta11, alpha11 );
272  bl1_dinvscals( beta11, alpha11 );
273  bl1_dinvscals( beta11, alpha11 );
274 
275  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
276  // FLA_MINUS_ONE, A20, b10t, FLA_ONE, a21 );
277  bl1_dgemv( BLIS1_NO_TRANSPOSE,
278  BLIS1_CONJUGATE,
279  m_ahead,
280  m_behind,
281  buff_m1,
282  A20, rs_A, cs_A,
283  b10t, cs_B,
284  buff_1,
285  a21, rs_A );
286 
287  // FLA_Inv_scal_external( beta11, a21 );
288  bl1_dinvscalv( BLIS1_NO_CONJUGATE,
289  m_ahead,
290  beta11,
291  a21, rs_A );
292 
293  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
294  bl1_daxpyv( BLIS1_NO_CONJUGATE,
295  m_behind,
296  buff_m1h,
297  y10t, cs_Y,
298  a10t, cs_A );
299 
300  // FLA_Inv_scal_external( beta11, a10t );
301  bl1_dinvscalv( BLIS1_NO_CONJUGATE,
302  m_behind,
303  beta11,
304  a10t, cs_A );
305 
306  // FLA_Ger_external( FLA_ONE, b21, a10t, Y20 );
307  bl1_dger( BLIS1_NO_CONJUGATE,
308  BLIS1_NO_CONJUGATE,
309  m_ahead,
310  m_behind,
311  buff_1,
312  b21, rs_B,
313  a10t, cs_A,
314  Y20, rs_Y, cs_Y );
315 
316  // FLA_Copy_external( b21, y21 );
317  // FLA_Scal_external( alpha11, y21 );
318  bl1_dcopyv( BLIS1_NO_CONJUGATE,
319  m_ahead,
320  b21, rs_B,
321  y21, rs_Y );
322  bl1_dscalv( BLIS1_NO_CONJUGATE,
323  m_ahead,
324  alpha11,
325  y21, rs_Y );
326 
327  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
328  // FLA_ONE, B20, a10t, FLA_ONE, y21 );
329  bl1_dgemv( BLIS1_NO_TRANSPOSE,
330  BLIS1_CONJUGATE,
331  m_ahead,
332  m_behind,
333  buff_1,
334  B20, rs_B, cs_B,
335  a10t, cs_A,
336  buff_1,
337  y21, rs_Y );
338 
339  /*------------------------------------------------------------*/
340 
341  }
342 
343  return FLA_SUCCESS;
344 }
void bl1_daxpyv(conj1_t conj, int n, double *alpha, double *x, int incx, double *y, int incy)
Definition: bl1_axpyv.c:21
void bl1_dcopyv(conj1_t conj, int m, double *x, int incx, double *y, int incy)
Definition: bl1_copyv.c:42
void bl1_ddot2s(conj1_t conj, int n, double *alpha, double *x, int incx, double *y, int incy, double *beta, double *rho)
Definition: bl1_dot2s.c:26
void bl1_dgemv(trans1_t transa, conj1_t conjx, int m, int n, double *alpha, double *a, int a_rs, int a_cs, double *x, int incx, double *beta, double *y, int incy)
Definition: bl1_gemv.c:69
void bl1_dger(conj1_t conjx, conj1_t conjy, int m, int n, double *alpha, double *x, int incx, double *y, int incy, double *a, int a_rs, int a_cs)
Definition: bl1_ger.c:62
void bl1_dinvscalv(conj1_t conj, int n, double *alpha, double *x, int incx)
Definition: bl1_invscalv.c:26
void bl1_dscalv(conj1_t conj, int n, double *alpha, double *x, int incx)
Definition: bl1_scalv.c:24

References bl1_daxpyv(), bl1_dcopyv(), bl1_ddot2s(), bl1_dgemv(), bl1_dger(), bl1_dinvscalv(), bl1_dscalv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, FLA_MINUS_ONE, FLA_MINUS_ONE_HALF, FLA_ONE, and i.

Referenced by FLA_Eig_gest_il_opt_var3().

◆ FLA_Eig_gest_il_ops_var3()

FLA_Error FLA_Eig_gest_il_ops_var3 ( int  m_AB,
float *  buff_A,
int  rs_A,
int  cs_A,
float *  buff_Y,
int  rs_Y,
int  cs_Y,
float *  buff_B,
int  rs_B,
int  cs_B 
)
102 {
103  float* buff_1 = FLA_FLOAT_PTR( FLA_ONE );
104  float* buff_m1 = FLA_FLOAT_PTR( FLA_MINUS_ONE );
105  float* buff_m1h = FLA_FLOAT_PTR( FLA_MINUS_ONE_HALF );
106  int i;
107 
108  for ( i = 0; i < m_AB; ++i )
109  {
110  float* a10t = buff_A + (0 )*cs_A + (i )*rs_A;
111  float* A20 = buff_A + (0 )*cs_A + (i+1)*rs_A;
112  float* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
113  float* a21 = buff_A + (i )*cs_A + (i+1)*rs_A;
114 
115  float* y10t = buff_Y + (0 )*cs_Y + (i )*rs_Y;
116  float* Y20 = buff_Y + (0 )*cs_Y + (i+1)*rs_Y;
117  float* y21 = buff_Y + (i )*cs_Y + (i+1)*rs_Y;
118 
119  float* b10t = buff_B + (0 )*cs_B + (i )*rs_B;
120  float* B20 = buff_B + (0 )*cs_B + (i+1)*rs_B;
121  float* beta11 = buff_B + (i )*cs_B + (i )*rs_B;
122  float* b21 = buff_B + (i )*cs_B + (i+1)*rs_B;
123 
124  int m_ahead = m_AB - i - 1;
125  int m_behind = i;
126 
127  /*------------------------------------------------------------*/
128 
129  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
130  bl1_saxpyv( BLIS1_NO_CONJUGATE,
131  m_behind,
132  buff_m1h,
133  y10t, cs_Y,
134  a10t, cs_A );
135 
136  // FLA_Dot2cs_external( FLA_CONJUGATE, FLA_MINUS_ONE, a10t, b10t, FLA_ONE, alpha11 );
137  bl1_sdot2s( BLIS1_CONJUGATE,
138  m_behind,
139  buff_m1,
140  a10t, cs_A,
141  b10t, cs_B,
142  buff_1,
143  alpha11 );
144 
145  // FLA_Inv_scal_external( beta11, alpha11 );
146  // FLA_Inv_scal_external( beta11, alpha11 );
147  bl1_sinvscals( beta11, alpha11 );
148  bl1_sinvscals( beta11, alpha11 );
149 
150  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
151  // FLA_MINUS_ONE, A20, b10t, FLA_ONE, a21 );
152  bl1_sgemv( BLIS1_NO_TRANSPOSE,
153  BLIS1_CONJUGATE,
154  m_ahead,
155  m_behind,
156  buff_m1,
157  A20, rs_A, cs_A,
158  b10t, cs_B,
159  buff_1,
160  a21, rs_A );
161 
162  // FLA_Inv_scal_external( beta11, a21 );
163  bl1_sinvscalv( BLIS1_NO_CONJUGATE,
164  m_ahead,
165  beta11,
166  a21, rs_A );
167 
168  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
169  bl1_saxpyv( BLIS1_NO_CONJUGATE,
170  m_behind,
171  buff_m1h,
172  y10t, cs_Y,
173  a10t, cs_A );
174 
175  // FLA_Inv_scal_external( beta11, a10t );
176  bl1_sinvscalv( BLIS1_NO_CONJUGATE,
177  m_behind,
178  beta11,
179  a10t, cs_A );
180 
181  // FLA_Ger_external( FLA_ONE, b21, a10t, Y20 );
182  bl1_sger( BLIS1_NO_CONJUGATE,
183  BLIS1_NO_CONJUGATE,
184  m_ahead,
185  m_behind,
186  buff_1,
187  b21, rs_B,
188  a10t, cs_A,
189  Y20, rs_Y, cs_Y );
190 
191  // FLA_Copy_external( b21, y21 );
192  // FLA_Scal_external( alpha11, y21 );
193  bl1_scopyv( BLIS1_NO_CONJUGATE,
194  m_ahead,
195  b21, rs_B,
196  y21, rs_Y );
197  bl1_sscalv( BLIS1_NO_CONJUGATE,
198  m_ahead,
199  alpha11,
200  y21, rs_Y );
201 
202  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
203  // FLA_ONE, B20, a10t, FLA_ONE, y21 );
204  bl1_sgemv( BLIS1_NO_TRANSPOSE,
205  BLIS1_CONJUGATE,
206  m_ahead,
207  m_behind,
208  buff_1,
209  B20, rs_B, cs_B,
210  a10t, cs_A,
211  buff_1,
212  y21, rs_Y );
213 
214  /*------------------------------------------------------------*/
215 
216  }
217 
218  return FLA_SUCCESS;
219 }
void bl1_saxpyv(conj1_t conj, int n, float *alpha, float *x, int incx, float *y, int incy)
Definition: bl1_axpyv.c:13
void bl1_scopyv(conj1_t conj, int m, float *x, int incx, float *y, int incy)
Definition: bl1_copyv.c:35
void bl1_sdot2s(conj1_t conj, int n, float *alpha, float *x, int incx, float *y, int incy, float *beta, float *rho)
Definition: bl1_dot2s.c:13
void bl1_sgemv(trans1_t transa, conj1_t conjx, int m, int n, float *alpha, float *a, int a_rs, int a_cs, float *x, int incx, float *beta, float *y, int incy)
Definition: bl1_gemv.c:13
void bl1_sger(conj1_t conjx, conj1_t conjy, int m, int n, float *alpha, float *x, int incx, float *y, int incy, float *a, int a_rs, int a_cs)
Definition: bl1_ger.c:13
void bl1_sinvscalv(conj1_t conj, int n, float *alpha, float *x, int incx)
Definition: bl1_invscalv.c:13
void bl1_sscalv(conj1_t conj, int n, float *alpha, float *x, int incx)
Definition: bl1_scalv.c:13

References bl1_saxpyv(), bl1_scopyv(), bl1_sdot2s(), bl1_sgemv(), bl1_sger(), bl1_sinvscalv(), bl1_sscalv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, FLA_MINUS_ONE, FLA_MINUS_ONE_HALF, FLA_ONE, and i.

Referenced by FLA_Eig_gest_il_opt_var3().

◆ FLA_Eig_gest_il_opt_var3()

FLA_Error FLA_Eig_gest_il_opt_var3 ( FLA_Obj  A,
FLA_Obj  Y,
FLA_Obj  B 
)
14 {
15  FLA_Datatype datatype;
16  int m_AB;
17  int rs_A, cs_A;
18  int rs_Y, cs_Y;
19  int rs_B, cs_B;
20 
21  datatype = FLA_Obj_datatype( A );
22 
23  m_AB = FLA_Obj_length( A );
24 
25  rs_A = FLA_Obj_row_stride( A );
26  cs_A = FLA_Obj_col_stride( A );
27 
28  rs_Y = FLA_Obj_row_stride( Y );
29  cs_Y = FLA_Obj_col_stride( Y );
30 
31  rs_B = FLA_Obj_row_stride( B );
32  cs_B = FLA_Obj_col_stride( B );
33 
34  switch ( datatype )
35  {
36  case FLA_FLOAT:
37  {
38  float* buff_A = FLA_FLOAT_PTR( A );
39  float* buff_Y = FLA_FLOAT_PTR( Y );
40  float* buff_B = FLA_FLOAT_PTR( B );
41 
42  FLA_Eig_gest_il_ops_var3( m_AB,
43  buff_A, rs_A, cs_A,
44  buff_Y, rs_Y, cs_Y,
45  buff_B, rs_B, cs_B );
46 
47  break;
48  }
49 
50  case FLA_DOUBLE:
51  {
52  double* buff_A = FLA_DOUBLE_PTR( A );
53  double* buff_Y = FLA_DOUBLE_PTR( Y );
54  double* buff_B = FLA_DOUBLE_PTR( B );
55 
56  FLA_Eig_gest_il_opd_var3( m_AB,
57  buff_A, rs_A, cs_A,
58  buff_Y, rs_Y, cs_Y,
59  buff_B, rs_B, cs_B );
60 
61  break;
62  }
63 
64  case FLA_COMPLEX:
65  {
66  scomplex* buff_A = FLA_COMPLEX_PTR( A );
67  scomplex* buff_Y = FLA_COMPLEX_PTR( Y );
68  scomplex* buff_B = FLA_COMPLEX_PTR( B );
69 
70  FLA_Eig_gest_il_opc_var3( m_AB,
71  buff_A, rs_A, cs_A,
72  buff_Y, rs_Y, cs_Y,
73  buff_B, rs_B, cs_B );
74 
75  break;
76  }
77 
78  case FLA_DOUBLE_COMPLEX:
79  {
80  dcomplex* buff_A = FLA_DOUBLE_COMPLEX_PTR( A );
81  dcomplex* buff_Y = FLA_DOUBLE_COMPLEX_PTR( Y );
82  dcomplex* buff_B = FLA_DOUBLE_COMPLEX_PTR( B );
83 
84  FLA_Eig_gest_il_opz_var3( m_AB,
85  buff_A, rs_A, cs_A,
86  buff_Y, rs_Y, cs_Y,
87  buff_B, rs_B, cs_B );
88 
89  break;
90  }
91  }
92 
93  return FLA_SUCCESS;
94 }
FLA_Error FLA_Eig_gest_il_opd_var3(int m_AB, double *buff_A, int rs_A, int cs_A, double *buff_Y, int rs_Y, int cs_Y, double *buff_B, int rs_B, int cs_B)
Definition: FLA_Eig_gest_il_opt_var3.c:223
FLA_Error FLA_Eig_gest_il_ops_var3(int m_AB, float *buff_A, int rs_A, int cs_A, float *buff_Y, int rs_Y, int cs_Y, float *buff_B, int rs_B, int cs_B)
Definition: FLA_Eig_gest_il_opt_var3.c:98
FLA_Error FLA_Eig_gest_il_opz_var3(int m_AB, dcomplex *buff_A, int rs_A, int cs_A, dcomplex *buff_Y, int rs_Y, int cs_Y, dcomplex *buff_B, int rs_B, int cs_B)
Definition: FLA_Eig_gest_il_opt_var3.c:473
FLA_Error FLA_Eig_gest_il_opc_var3(int m_AB, scomplex *buff_A, int rs_A, int cs_A, scomplex *buff_Y, int rs_Y, int cs_Y, scomplex *buff_B, int rs_B, int cs_B)
Definition: FLA_Eig_gest_il_opt_var3.c:348
dim_t FLA_Obj_row_stride(FLA_Obj obj)
Definition: FLA_Query.c:167
dim_t FLA_Obj_length(FLA_Obj obj)
Definition: FLA_Query.c:116
dim_t FLA_Obj_col_stride(FLA_Obj obj)
Definition: FLA_Query.c:174
FLA_Datatype FLA_Obj_datatype(FLA_Obj obj)
Definition: FLA_Query.c:13
int FLA_Datatype
Definition: FLA_type_defs.h:49
Definition: blis_type_defs.h:138

References FLA_Eig_gest_il_opc_var3(), FLA_Eig_gest_il_opd_var3(), FLA_Eig_gest_il_ops_var3(), FLA_Eig_gest_il_opz_var3(), FLA_Obj_col_stride(), FLA_Obj_datatype(), FLA_Obj_length(), and FLA_Obj_row_stride().

Referenced by FLA_Eig_gest_il().

◆ FLA_Eig_gest_il_opz_var3()

FLA_Error FLA_Eig_gest_il_opz_var3 ( int  m_AB,
dcomplex *  buff_A,
int  rs_A,
int  cs_A,
dcomplex *  buff_Y,
int  rs_Y,
int  cs_Y,
dcomplex *  buff_B,
int  rs_B,
int  cs_B 
)
477 {
478  dcomplex* buff_1 = FLA_DOUBLE_COMPLEX_PTR( FLA_ONE );
479  dcomplex* buff_m1 = FLA_DOUBLE_COMPLEX_PTR( FLA_MINUS_ONE );
480  dcomplex* buff_m1h = FLA_DOUBLE_COMPLEX_PTR( FLA_MINUS_ONE_HALF );
481  int i;
482 
483  for ( i = 0; i < m_AB; ++i )
484  {
485  dcomplex* a10t = buff_A + (0 )*cs_A + (i )*rs_A;
486  dcomplex* A20 = buff_A + (0 )*cs_A + (i+1)*rs_A;
487  dcomplex* alpha11 = buff_A + (i )*cs_A + (i )*rs_A;
488  dcomplex* a21 = buff_A + (i )*cs_A + (i+1)*rs_A;
489 
490  dcomplex* y10t = buff_Y + (0 )*cs_Y + (i )*rs_Y;
491  dcomplex* Y20 = buff_Y + (0 )*cs_Y + (i+1)*rs_Y;
492  dcomplex* y21 = buff_Y + (i )*cs_Y + (i+1)*rs_Y;
493 
494  dcomplex* b10t = buff_B + (0 )*cs_B + (i )*rs_B;
495  dcomplex* B20 = buff_B + (0 )*cs_B + (i+1)*rs_B;
496  dcomplex* beta11 = buff_B + (i )*cs_B + (i )*rs_B;
497  dcomplex* b21 = buff_B + (i )*cs_B + (i+1)*rs_B;
498 
499  int m_ahead = m_AB - i - 1;
500  int m_behind = i;
501 
502  /*------------------------------------------------------------*/
503 
504  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
505  bl1_zaxpyv( BLIS1_NO_CONJUGATE,
506  m_behind,
507  buff_m1h,
508  y10t, cs_Y,
509  a10t, cs_A );
510 
511  // FLA_Dot2cs_external( FLA_CONJUGATE, FLA_MINUS_ONE, a10t, b10t, FLA_ONE, alpha11 );
512  bl1_zdot2s( BLIS1_CONJUGATE,
513  m_behind,
514  buff_m1,
515  a10t, cs_A,
516  b10t, cs_B,
517  buff_1,
518  alpha11 );
519 
520  // FLA_Inv_scal_external( beta11, alpha11 );
521  // FLA_Inv_scal_external( beta11, alpha11 );
522  bl1_zinvscals( beta11, alpha11 );
523  bl1_zinvscals( beta11, alpha11 );
524 
525  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
526  // FLA_MINUS_ONE, A20, b10t, FLA_ONE, a21 );
527  bl1_zgemv( BLIS1_NO_TRANSPOSE,
528  BLIS1_CONJUGATE,
529  m_ahead,
530  m_behind,
531  buff_m1,
532  A20, rs_A, cs_A,
533  b10t, cs_B,
534  buff_1,
535  a21, rs_A );
536 
537  // FLA_Inv_scal_external( beta11, a21 );
538  bl1_zinvscalv( BLIS1_NO_CONJUGATE,
539  m_ahead,
540  beta11,
541  a21, rs_A );
542 
543  // FLA_Axpy_external( FLA_MINUS_ONE_HALF, y10t, a10t );
544  bl1_zaxpyv( BLIS1_NO_CONJUGATE,
545  m_behind,
546  buff_m1h,
547  y10t, cs_Y,
548  a10t, cs_A );
549 
550  // FLA_Inv_scal_external( beta11, a10t );
551  bl1_zinvscalv( BLIS1_NO_CONJUGATE,
552  m_behind,
553  beta11,
554  a10t, cs_A );
555 
556  // FLA_Ger_external( FLA_ONE, b21, a10t, Y20 );
557  bl1_zger( BLIS1_NO_CONJUGATE,
558  BLIS1_NO_CONJUGATE,
559  m_ahead,
560  m_behind,
561  buff_1,
562  b21, rs_B,
563  a10t, cs_A,
564  Y20, rs_Y, cs_Y );
565 
566  // FLA_Copy_external( b21, y21 );
567  // FLA_Scal_external( alpha11, y21 );
568  bl1_zcopyv( BLIS1_NO_CONJUGATE,
569  m_ahead,
570  b21, rs_B,
571  y21, rs_Y );
572  bl1_zscalv( BLIS1_NO_CONJUGATE,
573  m_ahead,
574  alpha11,
575  y21, rs_Y );
576 
577  // FLA_Gemvc_external( FLA_NO_TRANSPOSE, FLA_CONJUGATE,
578  // FLA_ONE, B20, a10t, FLA_ONE, y21 );
579  bl1_zgemv( BLIS1_NO_TRANSPOSE,
580  BLIS1_CONJUGATE,
581  m_ahead,
582  m_behind,
583  buff_1,
584  B20, rs_B, cs_B,
585  a10t, cs_A,
586  buff_1,
587  y21, rs_Y );
588 
589  /*------------------------------------------------------------*/
590 
591  }
592 
593  return FLA_SUCCESS;
594 }
void bl1_zaxpyv(conj1_t conj, int n, dcomplex *alpha, dcomplex *x, int incx, dcomplex *y, int incy)
Definition: bl1_axpyv.c:60
void bl1_zcopyv(conj1_t conj, int m, dcomplex *x, int incx, dcomplex *y, int incy)
Definition: bl1_copyv.c:63
void bl1_zdot2s(conj1_t conj, int n, dcomplex *alpha, dcomplex *x, int incx, dcomplex *y, int incy, dcomplex *beta, dcomplex *rho)
Definition: bl1_dot2s.c:70
void bl1_zgemv(trans1_t transa, conj1_t conjx, int m, int n, dcomplex *alpha, dcomplex *a, int a_rs, int a_cs, dcomplex *x, int incx, dcomplex *beta, dcomplex *y, int incy)
Definition: bl1_gemv.c:255
void bl1_zger(conj1_t conjx, conj1_t conjy, int m, int n, dcomplex *alpha, dcomplex *x, int incx, dcomplex *y, int incy, dcomplex *a, int a_rs, int a_cs)
Definition: bl1_ger.c:194
void bl1_zinvscalv(conj1_t conj, int n, dcomplex *alpha, dcomplex *x, int incx)
Definition: bl1_invscalv.c:78
void bl1_zscalv(conj1_t conj, int n, dcomplex *alpha, dcomplex *x, int incx)
Definition: bl1_scalv.c:72

References bl1_zaxpyv(), bl1_zcopyv(), bl1_zdot2s(), bl1_zgemv(), bl1_zger(), bl1_zinvscalv(), bl1_zscalv(), BLIS1_CONJUGATE, BLIS1_NO_CONJUGATE, BLIS1_NO_TRANSPOSE, FLA_MINUS_ONE, FLA_MINUS_ONE_HALF, FLA_ONE, and i.

Referenced by FLA_Eig_gest_il_opt_var3().