libflame  revision_anchor
Functions
bli_conjm.c File Reference

(r)

Functions

void bli_sconjm (int m, int n, float *a, int a_rs, int a_cs)
void bli_dconjm (int m, int n, double *a, int a_rs, int a_cs)
void bli_cconjm (int m, int n, scomplex *a, int a_rs, int a_cs)
void bli_zconjm (int m, int n, dcomplex *a, int a_rs, int a_cs)

Function Documentation

void bli_cconjm ( int  m,
int  n,
scomplex a,
int  a_rs,
int  a_cs 
)

References bli_is_row_storage(), bli_is_vector(), bli_sm1(), bli_sscal(), bli_vector_dim(), bli_vector_inc(), bli_zero_dim2(), and BLIS_NO_TRANSPOSE.

Referenced by bli_cgemm(), and FLA_Conjugate().

{
    float   m1 = bli_sm1();
    float*  a_conj;
    int     lda, inca;
    int     n_iter;
    int     n_elem;
    int     j;

    // Return early if possible.
    if ( bli_zero_dim2( m, n ) ) return;

    // Handle cases where A is a vector to ensure that the underlying axpy
    // gets invoked only once.
    if ( bli_is_vector( m, n ) )
    {
        // Initialize with values appropriate for a vector.
        n_iter = 1;
        n_elem = bli_vector_dim( m, n );
        lda    = 1; // multiplied by zero when n_iter == 1; not needed.
        inca   = bli_vector_inc( BLIS_NO_TRANSPOSE, m, n, a_rs, a_cs );
    }
    else // matrix case
    {
        // Initialize with optimal values for column-major storage.
        n_iter = n;
        n_elem = m;
        lda    = a_cs;
        inca   = a_rs;

        // An optimization: if A is row-major, then let's access the matrix
        // by rows instead of by columns to increase spatial locality.
        if ( bli_is_row_storage( a_rs, a_cs ) )
        {
            bli_swap_ints( n_iter, n_elem );
            bli_swap_ints( lda, inca );
        }
    }

    for ( j = 0; j < n_iter; ++j )
    {
        a_conj = ( float* )( a + j*lda ) + 1;

        bli_sscal( n_elem,
                   &m1,
                   a_conj, 2*inca );
    }
}
void bli_dconjm ( int  m,
int  n,
double *  a,
int  a_rs,
int  a_cs 
)
{
    return;
}
void bli_sconjm ( int  m,
int  n,
float *  a,
int  a_rs,
int  a_cs 
)
{
    return;
}
void bli_zconjm ( int  m,
int  n,
dcomplex a,
int  a_rs,
int  a_cs 
)

References bli_dm1(), bli_dscal(), bli_is_row_storage(), bli_is_vector(), bli_vector_dim(), bli_vector_inc(), bli_zero_dim2(), and BLIS_NO_TRANSPOSE.

Referenced by bli_zgemm(), and FLA_Conjugate().

{
    double  m1 = bli_dm1();
    double* a_conj;
    int     lda, inca;
    int     n_iter;
    int     n_elem;
    int     j;

    // Return early if possible.
    if ( bli_zero_dim2( m, n ) ) return;

    // Handle cases where A is a vector to ensure that the underlying axpy
    // gets invoked only once.
    if ( bli_is_vector( m, n ) )
    {
        // Initialize with values appropriate for a vector.
        n_iter = 1;
        n_elem = bli_vector_dim( m, n );
        lda    = 1; // multiplied by zero when n_iter == 1; not needed.
        inca   = bli_vector_inc( BLIS_NO_TRANSPOSE, m, n, a_rs, a_cs );
    }
    else // matrix case
    {
        // Initialize with optimal values for column-major storage.
        n_iter = n;
        n_elem = m;
        lda    = a_cs;
        inca   = a_rs;

        // An optimization: if A is row-major, then let's access the matrix
        // by rows instead of by columns to increase spatial locality.
        if ( bli_is_row_storage( a_rs, a_cs ) )
        {
            bli_swap_ints( n_iter, n_elem );
            bli_swap_ints( lda, inca );
        }
    }

    for ( j = 0; j < n_iter; ++j )
    {
        a_conj = ( double* )( a + j*lda ) + 1;

        bli_dscal( n_elem,
                   &m1,
                   a_conj, 2*inca );
    }
}