libflame
revision_anchor
|
00001 /* 00002 libflame 00003 An object-based infrastructure for developing high-performance 00004 dense linear algebra libraries. 00005 00006 Copyright (C) 2011, The University of Texas 00007 00008 libflame is free software; you can redistribute it and/or modify 00009 it under the terms of the GNU Lesser General Public License as 00010 published by the Free Software Foundation; either version 2.1 of 00011 the License, or (at your option) any later version. 00012 00013 libflame is distributed in the hope that it will be useful, but 00014 WITHOUT ANY WARRANTY; without even the implied warranty of 00015 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU 00016 Lesser General Public License for more details. 00017 00018 You should have received a copy of the GNU Lesser General Public 00019 License along with libflame; if you did not receive a copy, see 00020 http://www.gnu.org/licenses/. 00021 00022 For more information, please contact us at flame@cs.utexas.edu or 00023 send mail to: 00024 00025 Field G. Van Zee and/or 00026 Robert A. van de Geijn 00027 The University of Texas at Austin 00028 Department of Computer Sciences 00029 1 University Station C0500 00030 Austin TX 78712 00031 */ 00032 00033 // --- Fused Level-1 BLAS-like prototypes -------------------------------------- 00034 00035 // --- axmyv2 --- 00036 00037 void bli_saxmyv2( conj_t conjx, int n, float* alpha, float* beta, float* x, int inc_x, float* y, int inc_y, float* z, int inc_z ); 00038 void bli_daxmyv2( conj_t conjx, int n, double* alpha, double* beta, double* x, int inc_x, double* y, int inc_y, double* z, int inc_z ); 00039 void bli_caxmyv2( conj_t conjx, int n, scomplex* alpha, scomplex* beta, scomplex* x, int inc_x, scomplex* y, int inc_y, scomplex* z, int inc_z ); 00040 void bli_zaxmyv2( conj_t conjx, int n, dcomplex* alpha, dcomplex* beta, dcomplex* x, int inc_x, dcomplex* y, int inc_y, dcomplex* z, int inc_z ); 00041 00042 // --- axpyv2b --- 00043 00044 void bli_saxpyv2b( int n, float* beta1, float* beta2, float* a1, int inc_a1, float* a2, int inc_a2, float* w, int inc_w ); 00045 void bli_daxpyv2b( int n, double* beta1, double* beta2, double* a1, int inc_a1, double* a2, int inc_a2, double* w, int inc_w ); 00046 void bli_caxpyv2b( int n, scomplex* beta1, scomplex* beta2, scomplex* a1, int inc_a1, scomplex* a2, int inc_a2, scomplex* w, int inc_w ); 00047 void bli_zaxpyv2b( int n, dcomplex* beta1, dcomplex* beta2, dcomplex* a1, int inc_a1, dcomplex* a2, int inc_a2, dcomplex* w, int inc_w ); 00048 00049 // --- axpyv3b --- 00050 00051 void bli_saxpyv3b( int n, float* beta1, float* beta2, float* beta3, float* a1, int inc_a1, float* a2, int inc_a2, float* a3, int inc_a3, float* w, int inc_w ); 00052 void bli_daxpyv3b( int n, double* beta1, double* beta2, double* beta3, double* a1, int inc_a1, double* a2, int inc_a2, double* a3, int inc_a3, double* w, int inc_w ); 00053 void bli_caxpyv3b( int n, scomplex* beta1, scomplex* beta2, scomplex* beta3, scomplex* a1, int inc_a1, scomplex* a2, int inc_a2, scomplex* a3, int inc_a3, scomplex* w, int inc_w ); 00054 void bli_zaxpyv3b( int n, dcomplex* beta1, dcomplex* beta2, dcomplex* beta3, dcomplex* a1, int inc_a1, dcomplex* a2, int inc_a2, dcomplex* a3, int inc_a3, dcomplex* w, int inc_w ); 00055 00056 // --- axpyv2bdotaxpy --- 00057 00058 void bli_saxpyv2bdotaxpy( int n, float* beta, float* u, int inc_u, float* gamma, float* z, int inc_z, float* a, int inc_a, float* x, int inc_x, float* kappa, float* rho, float* w, int inc_w ); 00059 void bli_daxpyv2bdotaxpy( int n, double* beta, double* u, int inc_u, double* gamma, double* z, int inc_z, double* a, int inc_a, double* x, int inc_x, double* kappa, double* rho, double* w, int inc_w ); 00060 void bli_caxpyv2bdotaxpy( int n, scomplex* beta, scomplex* u, int inc_u, scomplex* gamma, scomplex* z, int inc_z, scomplex* a, int inc_a, scomplex* x, int inc_x, scomplex* kappa, scomplex* rho, scomplex* w, int inc_w ); 00061 void bli_zaxpyv2bdotaxpy( int n, dcomplex* beta, dcomplex* u, int inc_u, dcomplex* gamma, dcomplex* z, int inc_z, dcomplex* a, int inc_a, dcomplex* x, int inc_x, dcomplex* kappa, dcomplex* rho, dcomplex* w, int inc_w ); 00062 00063 // --- dotsv2 --- 00064 00065 void bli_sdotsv2( conj_t conjxy, int n, float* x, int inc_x, float* y, int inc_y, float* z, int inc_z, float* beta, float* rho_xz, float* rho_yz ); 00066 void bli_ddotsv2( conj_t conjxy, int n, double* x, int inc_x, double* y, int inc_y, double* z, int inc_z, double* beta, double* rho_xz, double* rho_yz ); 00067 void bli_cdotsv2( conj_t conjxy, int n, scomplex* x, int inc_x, scomplex* y, int inc_y, scomplex* z, int inc_z, scomplex* beta, scomplex* rho_xz, scomplex* rho_yz ); 00068 void bli_zdotsv2( conj_t conjxy, int n, dcomplex* x, int inc_x, dcomplex* y, int inc_y, dcomplex* z, int inc_z, dcomplex* beta, dcomplex* rho_xz, dcomplex* rho_yz ); 00069 00070 // --- dotsv3 --- 00071 00072 void bli_sdotsv3( conj_t conjxyw, int n, float* x, int inc_x, float* y, int inc_y, float* w, int inc_w, float* z, int inc_z, float* beta, float* rho_xz, float* rho_yz, float* rho_wz ); 00073 void bli_ddotsv3( conj_t conjxyw, int n, double* x, int inc_x, double* y, int inc_y, double* w, int inc_w, double* z, int inc_z, double* beta, double* rho_xz, double* rho_yz, double* rho_wz ); 00074 void bli_cdotsv3( conj_t conjxyw, int n, scomplex* x, int inc_x, scomplex* y, int inc_y, scomplex* w, int inc_w, scomplex* z, int inc_z, scomplex* beta, scomplex* rho_xz, scomplex* rho_yz, scomplex* rho_wz ); 00075 void bli_zdotsv3( conj_t conjxyw, int n, dcomplex* x, int inc_x, dcomplex* y, int inc_y, dcomplex* w, int inc_w, dcomplex* z, int inc_z, dcomplex* beta, dcomplex* rho_xz, dcomplex* rho_yz, dcomplex* rho_wz ); 00076 00077 // --- dotaxpy --- 00078 00079 void bli_sdotaxpy( int n, float* a, int inc_a, float* x, int inc_x, float* kappa, float* rho, float* w, int inc_w ); 00080 void bli_ddotaxpy( int n, double* a, int inc_a, double* x, int inc_x, double* kappa, double* rho, double* w, int inc_w ); 00081 void bli_cdotaxpy( int n, scomplex* a, int inc_a, scomplex* x, int inc_x, scomplex* kappa, scomplex* rho, scomplex* w, int inc_w ); 00082 void bli_zdotaxpy( int n, dcomplex* a, int inc_a, dcomplex* x, int inc_x, dcomplex* kappa, dcomplex* rho, dcomplex* w, int inc_w ); 00083 00084 // --- dotaxmyv2 --- 00085 00086 void bli_sdotaxmyv2( int n, float* alpha, float* beta, float* x, int inc_x, float* u, int inc_u, float* rho, float* y, int inc_y, float* z, int inc_z ); 00087 void bli_ddotaxmyv2( int n, double* alpha, double* beta, double* x, int inc_x, double* u, int inc_u, double* rho, double* y, int inc_y, double* z, int inc_z ); 00088 void bli_cdotaxmyv2( int n, scomplex* alpha, scomplex* beta, scomplex* x, int inc_x, scomplex* u, int inc_u, scomplex* rho, scomplex* y, int inc_y, scomplex* z, int inc_z ); 00089 void bli_zdotaxmyv2( int n, dcomplex* alpha, dcomplex* beta, dcomplex* x, int inc_x, dcomplex* u, int inc_u, dcomplex* rho, dcomplex* y, int inc_y, dcomplex* z, int inc_z ); 00090 00091 // --- dotv2axpyv2b --- 00092 00093 void bli_sdotv2axpyv2b( int n, float* a1, int inc_a1, float* a2, int inc_a2, float* x, int inc_x, float* kappa1, float* kappa2, float* rho1, float* rho2, float* w, int inc_w ); 00094 void bli_ddotv2axpyv2b( int n, double* a1, int inc_a1, double* a2, int inc_a2, double* x, int inc_x, double* kappa1, double* kappa2, double* rho1, double* rho2, double* w, int inc_w ); 00095 void bli_cdotv2axpyv2b( int n, scomplex* a1, int inc_a1, scomplex* a2, int inc_a2, scomplex* x, int inc_x, scomplex* kappa1, scomplex* kappa2, scomplex* rho1, scomplex* rho2, scomplex* w, int inc_w ); 00096 void bli_zdotv2axpyv2b( int n, dcomplex* a1, int inc_a1, dcomplex* a2, int inc_a2, dcomplex* x, int inc_x, dcomplex* kappa1, dcomplex* kappa2, dcomplex* rho1, dcomplex* rho2, dcomplex* w, int inc_w ); 00097 00098 // --- axpyv2bdots --- 00099 00100 void bli_zaxpyv2bdots( int n, 00101 dcomplex* alpha1, 00102 dcomplex* alpha2, 00103 dcomplex* x1, int inc_x1, 00104 dcomplex* x2, int inc_x2, 00105 dcomplex* y, int inc_y, 00106 dcomplex* u, int inc_u, 00107 dcomplex* beta, 00108 dcomplex* rho );