libflame  revision_anchor
Functions
FLA_Axpys_external.c File Reference

(r)

Functions

FLA_Error FLA_Axpys_external (FLA_Obj alpha0, FLA_Obj alpha1, FLA_Obj A, FLA_Obj beta, FLA_Obj B)
 

Function Documentation

◆ FLA_Axpys_external()

FLA_Error FLA_Axpys_external ( FLA_Obj  alpha0,
FLA_Obj  alpha1,
FLA_Obj  A,
FLA_Obj  beta,
FLA_Obj  B 
)
14 {
15  FLA_Datatype datatype;
16  int m_B, n_B;
17  int rs_A, cs_A;
18  int rs_B, cs_B;
19  trans1_t blis_trans;
20 
21  if ( FLA_Check_error_level() == FLA_FULL_ERROR_CHECKING )
22  FLA_Axpys_check( alpha0, alpha1, A, beta, B );
23 
24  if ( FLA_Obj_has_zero_dim( A ) ) return FLA_SUCCESS;
25 
26  datatype = FLA_Obj_datatype( A );
27 
28  rs_A = FLA_Obj_row_stride( A );
29  cs_A = FLA_Obj_col_stride( A );
30 
31  m_B = FLA_Obj_length( B );
32  n_B = FLA_Obj_width( B );
33  rs_B = FLA_Obj_row_stride( B );
34  cs_B = FLA_Obj_col_stride( B );
35 
36  FLA_Param_map_flame_to_blis_trans( FLA_NO_TRANSPOSE, &blis_trans );
37 
38  switch ( datatype ){
39 
40  case FLA_FLOAT:
41  {
42  float *buff_alpha0 = ( float * ) FLA_FLOAT_PTR( alpha0 );
43  float *buff_alpha1 = ( float * ) FLA_FLOAT_PTR( alpha1 );
44  float *buff_beta = ( float * ) FLA_FLOAT_PTR( beta );
45  float *buff_A = ( float * ) FLA_FLOAT_PTR( A );
46  float *buff_B = ( float * ) FLA_FLOAT_PTR( B );
47 
48  bl1_saxpysmt( blis_trans,
49  m_B,
50  n_B,
51  buff_alpha0,
52  buff_alpha1,
53  buff_A, rs_A, cs_A,
54  buff_beta,
55  buff_B, rs_B, cs_B );
56 
57  break;
58  }
59 
60  case FLA_DOUBLE:
61  {
62  double *buff_alpha0 = ( double * ) FLA_DOUBLE_PTR( alpha0 );
63  double *buff_alpha1 = ( double * ) FLA_DOUBLE_PTR( alpha1 );
64  double *buff_beta = ( double * ) FLA_DOUBLE_PTR( beta );
65  double *buff_A = ( double * ) FLA_DOUBLE_PTR( A );
66  double *buff_B = ( double * ) FLA_DOUBLE_PTR( B );
67 
68  bl1_daxpysmt( blis_trans,
69  m_B,
70  n_B,
71  buff_alpha0,
72  buff_alpha1,
73  buff_A, rs_A, cs_A,
74  buff_beta,
75  buff_B, rs_B, cs_B );
76 
77  break;
78  }
79 
80  case FLA_COMPLEX:
81  {
82  scomplex *buff_alpha0 = ( scomplex * ) FLA_COMPLEX_PTR( alpha0 );
83  scomplex *buff_alpha1 = ( scomplex * ) FLA_COMPLEX_PTR( alpha1 );
84  scomplex *buff_beta = ( scomplex * ) FLA_COMPLEX_PTR( beta );
85  scomplex *buff_A = ( scomplex * ) FLA_COMPLEX_PTR( A );
86  scomplex *buff_B = ( scomplex * ) FLA_COMPLEX_PTR( B );
87 
88  bl1_caxpysmt( blis_trans,
89  m_B,
90  n_B,
91  buff_alpha0,
92  buff_alpha1,
93  buff_A, rs_A, cs_A,
94  buff_beta,
95  buff_B, rs_B, cs_B );
96 
97  break;
98  }
99 
100  case FLA_DOUBLE_COMPLEX:
101  {
102  dcomplex *buff_alpha0 = ( dcomplex * ) FLA_DOUBLE_COMPLEX_PTR( alpha0 );
103  dcomplex *buff_alpha1 = ( dcomplex * ) FLA_DOUBLE_COMPLEX_PTR( alpha1 );
104  dcomplex *buff_beta = ( dcomplex * ) FLA_DOUBLE_COMPLEX_PTR( beta );
105  dcomplex *buff_A = ( dcomplex * ) FLA_DOUBLE_COMPLEX_PTR( A );
106  dcomplex *buff_B = ( dcomplex * ) FLA_DOUBLE_COMPLEX_PTR( B );
107 
108  bl1_zaxpysmt( blis_trans,
109  m_B,
110  n_B,
111  buff_alpha0,
112  buff_alpha1,
113  buff_A, rs_A, cs_A,
114  buff_beta,
115  buff_B, rs_B, cs_B );
116 
117  break;
118  }
119 
120  }
121 
122  return FLA_SUCCESS;
123 }
FLA_Error FLA_Axpys_check(FLA_Obj alpha0, FLA_Obj alpha1, FLA_Obj A, FLA_Obj beta, FLA_Obj B)
Definition: FLA_Axpys_check.c:13
dim_t FLA_Obj_width(FLA_Obj obj)
Definition: FLA_Query.c:123
FLA_Bool FLA_Obj_has_zero_dim(FLA_Obj A)
Definition: FLA_Query.c:400
dim_t FLA_Obj_row_stride(FLA_Obj obj)
Definition: FLA_Query.c:167
dim_t FLA_Obj_length(FLA_Obj obj)
Definition: FLA_Query.c:116
void FLA_Param_map_flame_to_blis_trans(FLA_Trans trans, trans1_t *blis_trans)
Definition: FLA_Param.c:245
dim_t FLA_Obj_col_stride(FLA_Obj obj)
Definition: FLA_Query.c:174
unsigned int FLA_Check_error_level(void)
Definition: FLA_Check.c:18
FLA_Datatype FLA_Obj_datatype(FLA_Obj obj)
Definition: FLA_Query.c:13
int FLA_Datatype
Definition: FLA_type_defs.h:49
void bl1_zaxpysmt(trans1_t trans, int m, int n, dcomplex *alpha0, dcomplex *alpha1, dcomplex *a, int a_rs, int a_cs, dcomplex *beta, dcomplex *b, int b_rs, int b_cs)
Definition: bl1_axpysmt.c:273
void bl1_saxpysmt(trans1_t trans, int m, int n, float *alpha0, float *alpha1, float *a, int a_rs, int a_cs, float *beta, float *b, int b_rs, int b_cs)
Definition: bl1_axpysmt.c:13
void bl1_caxpysmt(trans1_t trans, int m, int n, scomplex *alpha0, scomplex *alpha1, scomplex *a, int a_rs, int a_cs, scomplex *beta, scomplex *b, int b_rs, int b_cs)
Definition: bl1_axpysmt.c:163
void bl1_daxpysmt(trans1_t trans, int m, int n, double *alpha0, double *alpha1, double *a, int a_rs, int a_cs, double *beta, double *b, int b_rs, int b_cs)
Definition: bl1_axpysmt.c:88
double *restrict alpha1
Definition: bl1_axpyv2bdotaxpy.c:198
trans1_t
Definition: blis_type_defs.h:53
Definition: blis_type_defs.h:138
Definition: blis_type_defs.h:133

References alpha1, bl1_caxpysmt(), bl1_daxpysmt(), bl1_saxpysmt(), bl1_zaxpysmt(), FLA_Axpys_check(), FLA_Check_error_level(), FLA_Obj_col_stride(), FLA_Obj_datatype(), FLA_Obj_has_zero_dim(), FLA_Obj_length(), FLA_Obj_row_stride(), FLA_Obj_width(), and FLA_Param_map_flame_to_blis_trans().

Referenced by FLA_Axpys(), FLA_Hemm_ll_unb_var1(), FLA_Hemm_ll_unb_var2(), FLA_Hemm_ll_unb_var3(), FLA_Hemm_ll_unb_var4(), FLA_Hemm_ll_unb_var5(), FLA_Hemm_ll_unb_var6(), FLA_Hemm_ll_unb_var7(), FLA_Hemm_ll_unb_var8(), FLA_Hemm_lu_unb_var1(), FLA_Hemm_lu_unb_var2(), FLA_Hemm_lu_unb_var3(), FLA_Hemm_lu_unb_var4(), FLA_Hemm_lu_unb_var5(), FLA_Hemm_lu_unb_var6(), FLA_Hemm_lu_unb_var7(), FLA_Hemm_lu_unb_var8(), FLA_Hemm_rl_unb_var1(), FLA_Hemm_rl_unb_var2(), FLA_Hemm_rl_unb_var3(), FLA_Hemm_rl_unb_var4(), FLA_Hemm_rl_unb_var5(), FLA_Hemm_rl_unb_var6(), FLA_Hemm_rl_unb_var7(), FLA_Hemm_rl_unb_var8(), FLA_Hemm_ru_unb_var1(), FLA_Hemm_ru_unb_var2(), FLA_Hemm_ru_unb_var3(), FLA_Hemm_ru_unb_var4(), FLA_Hemm_ru_unb_var5(), FLA_Hemm_ru_unb_var6(), FLA_Hemm_ru_unb_var7(), FLA_Hemm_ru_unb_var8(), FLA_Symm_ll_unb_var1(), FLA_Symm_ll_unb_var2(), FLA_Symm_ll_unb_var3(), FLA_Symm_ll_unb_var4(), FLA_Symm_ll_unb_var5(), FLA_Symm_ll_unb_var6(), FLA_Symm_ll_unb_var7(), FLA_Symm_ll_unb_var8(), FLA_Symm_lu_unb_var1(), FLA_Symm_lu_unb_var2(), FLA_Symm_lu_unb_var3(), FLA_Symm_lu_unb_var4(), FLA_Symm_lu_unb_var5(), FLA_Symm_lu_unb_var6(), FLA_Symm_lu_unb_var7(), FLA_Symm_lu_unb_var8(), FLA_Symm_rl_unb_var1(), FLA_Symm_rl_unb_var2(), FLA_Symm_rl_unb_var3(), FLA_Symm_rl_unb_var4(), FLA_Symm_rl_unb_var5(), FLA_Symm_rl_unb_var6(), FLA_Symm_rl_unb_var7(), FLA_Symm_rl_unb_var8(), FLA_Symm_ru_unb_var1(), FLA_Symm_ru_unb_var2(), FLA_Symm_ru_unb_var3(), FLA_Symm_ru_unb_var4(), FLA_Symm_ru_unb_var5(), FLA_Symm_ru_unb_var6(), FLA_Symm_ru_unb_var7(), and FLA_Symm_ru_unb_var8().