|
libflame
12600
|
Functions | |
| void | bl1_saxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, float *alpha, float *a, int a_rs, int a_cs, float *b, int b_rs, int b_cs) |
| void | bl1_daxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, double *alpha, double *a, int a_rs, int a_cs, double *b, int b_rs, int b_cs) |
| void | bl1_caxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, scomplex *alpha, scomplex *a, int a_rs, int a_cs, scomplex *b, int b_rs, int b_cs) |
| void | bl1_zaxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, dcomplex *alpha, dcomplex *a, int a_rs, int a_cs, dcomplex *b, int b_rs, int b_cs) |
void bl1_caxpymrt( uplo1_t uplo, trans1_t trans, int m, int n, scomplex* alpha, scomplex* a, int a_rs, int a_cs, scomplex* b, int b_rs, int b_cs )
References bl1_caxpyv(), bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), and bl1_zero_dim2().
Referenced by bl1_cher2k(), bl1_cherk(), and FLA_Axpyrt_external().
{
    // Walks the uplo-selected triangular (or trapezoidal) part of the m x n
    // operand b one vector at a time and hands each vector, together with
    // the matching vector of a, to bl1_caxpyv() along with alpha and the
    // conj value derived from trans.
    // NOTE(review): presumably the net effect is B := B + alpha * op(A) on
    // that triangle; this depends on bl1_caxpyv(), which is not shown here.
    scomplex* a_vec;
    scomplex* b_vec;
    conj1_t   conj;
    int       a_ld, a_inc;
    int       b_ld, b_inc;
    int       min_mn;
    int       n_vecs;
    int       len_cap;
    int       len;
    int       shrinking;
    int       k;

    // Early exit, as decided by bl1_zero_dim2( m, n ).
    if ( bl1_zero_dim2( m, n ) ) return;

    min_mn = bl1_min( m, n );

    // The storage format of B fixes which strides act as "leading dimension"
    // (step between vectors) and "increment" (step within a vector); uplo
    // then fixes how many vectors there are and how their lengths evolve.
    if ( bl1_is_col_storage( b_rs, b_cs ) )
    {
        // Vector-to-vector step is the column stride, in-vector step is the
        // row stride.
        a_ld = a_cs;  a_inc = a_rs;
        b_ld = b_cs;  b_inc = b_rs;

        if ( bl1_is_lower( uplo ) )
        {
            // Vectors begin on the diagonal and lose one element per step.
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = m;
        }
        else // upper
        {
            // Vectors begin at the matrix edge and gain one element per
            // step, up to len_cap.
            shrinking = FALSE;
            n_vecs    = n;
            len_cap   = min_mn;
        }
    }
    else // row storage
    {
        // Vector-to-vector step is the row stride, in-vector step is the
        // column stride.
        a_ld = a_rs;  a_inc = a_cs;
        b_ld = b_rs;  b_inc = b_cs;

        if ( bl1_is_lower( uplo ) )
        {
            shrinking = FALSE;
            n_vecs    = m;
            len_cap   = min_mn;
        }
        else // upper
        {
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = n;
        }
    }

    // A transposed A is traversed with its two strides exchanged.
    if ( bl1_does_trans( trans ) )
    {
        bl1_swap_ints( a_ld, a_inc );
    }

    // Only the conjugation part of trans is forwarded to the vector kernel.
    conj = bl1_proj_trans1_to_conj( trans );

    for ( k = 0; k < n_vecs; ++k )
    {
        if ( shrinking )
        {
            // Start at the k-th diagonal element; k elements fewer than the
            // first vector.
            len   = len_cap - k;
            a_vec = a + k*a_ld + k*a_inc;
            b_vec = b + k*b_ld + k*b_inc;
        }
        else
        {
            // Start at the beginning of the k-th vector; k+1 elements unless
            // capped.
            len   = bl1_min( k + 1, len_cap );
            a_vec = a + k*a_ld;
            b_vec = b + k*b_ld;
        }

        bl1_caxpyv( conj,
                    len,
                    alpha,
                    a_vec, a_inc,
                    b_vec, b_inc );
    }
}
void bl1_daxpymrt( uplo1_t uplo, trans1_t trans, int m, int n, double* alpha, double* a, int a_rs, int a_cs, double* b, int b_rs, int b_cs )
References bl1_daxpyv(), bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), and bl1_zero_dim2().
Referenced by FLA_Axpyrt_external().
{
    // Walks the uplo-selected triangular (or trapezoidal) part of the m x n
    // operand b one vector at a time and hands each vector, together with
    // the matching vector of a, to bl1_daxpyv() along with alpha and the
    // conj value derived from trans.
    // NOTE(review): presumably the net effect is B := B + alpha * op(A) on
    // that triangle; this depends on bl1_daxpyv(), which is not shown here.
    double* a_vec;
    double* b_vec;
    conj1_t conj;
    int     a_ld, a_inc;
    int     b_ld, b_inc;
    int     min_mn;
    int     n_vecs;
    int     len_cap;
    int     len;
    int     shrinking;
    int     k;

    // Early exit, as decided by bl1_zero_dim2( m, n ).
    if ( bl1_zero_dim2( m, n ) ) return;

    min_mn = bl1_min( m, n );

    // The storage format of B fixes which strides act as "leading dimension"
    // (step between vectors) and "increment" (step within a vector); uplo
    // then fixes how many vectors there are and how their lengths evolve.
    if ( bl1_is_col_storage( b_rs, b_cs ) )
    {
        // Vector-to-vector step is the column stride, in-vector step is the
        // row stride.
        a_ld = a_cs;  a_inc = a_rs;
        b_ld = b_cs;  b_inc = b_rs;

        if ( bl1_is_lower( uplo ) )
        {
            // Vectors begin on the diagonal and lose one element per step.
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = m;
        }
        else // upper
        {
            // Vectors begin at the matrix edge and gain one element per
            // step, up to len_cap.
            shrinking = FALSE;
            n_vecs    = n;
            len_cap   = min_mn;
        }
    }
    else // row storage
    {
        // Vector-to-vector step is the row stride, in-vector step is the
        // column stride.
        a_ld = a_rs;  a_inc = a_cs;
        b_ld = b_rs;  b_inc = b_cs;

        if ( bl1_is_lower( uplo ) )
        {
            shrinking = FALSE;
            n_vecs    = m;
            len_cap   = min_mn;
        }
        else // upper
        {
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = n;
        }
    }

    // A transposed A is traversed with its two strides exchanged.
    if ( bl1_does_trans( trans ) )
    {
        bl1_swap_ints( a_ld, a_inc );
    }

    // Only the conjugation part of trans is forwarded to the vector kernel.
    conj = bl1_proj_trans1_to_conj( trans );

    for ( k = 0; k < n_vecs; ++k )
    {
        if ( shrinking )
        {
            // Start at the k-th diagonal element; k elements fewer than the
            // first vector.
            len   = len_cap - k;
            a_vec = a + k*a_ld + k*a_inc;
            b_vec = b + k*b_ld + k*b_inc;
        }
        else
        {
            // Start at the beginning of the k-th vector; k+1 elements unless
            // capped.
            len   = bl1_min( k + 1, len_cap );
            a_vec = a + k*a_ld;
            b_vec = b + k*b_ld;
        }

        bl1_daxpyv( conj,
                    len,
                    alpha,
                    a_vec, a_inc,
                    b_vec, b_inc );
    }
}
void bl1_saxpymrt( uplo1_t uplo, trans1_t trans, int m, int n, float* alpha, float* a, int a_rs, int a_cs, float* b, int b_rs, int b_cs )
References bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), bl1_saxpyv(), and bl1_zero_dim2().
Referenced by FLA_Axpyrt_external().
{
    // Walks the uplo-selected triangular (or trapezoidal) part of the m x n
    // operand b one vector at a time and hands each vector, together with
    // the matching vector of a, to bl1_saxpyv() along with alpha and the
    // conj value derived from trans.
    // NOTE(review): presumably the net effect is B := B + alpha * op(A) on
    // that triangle; this depends on bl1_saxpyv(), which is not shown here.
    float*  a_vec;
    float*  b_vec;
    conj1_t conj;
    int     a_ld, a_inc;
    int     b_ld, b_inc;
    int     min_mn;
    int     n_vecs;
    int     len_cap;
    int     len;
    int     shrinking;
    int     k;

    // Early exit, as decided by bl1_zero_dim2( m, n ).
    if ( bl1_zero_dim2( m, n ) ) return;

    min_mn = bl1_min( m, n );

    // The storage format of B fixes which strides act as "leading dimension"
    // (step between vectors) and "increment" (step within a vector); uplo
    // then fixes how many vectors there are and how their lengths evolve.
    if ( bl1_is_col_storage( b_rs, b_cs ) )
    {
        // Vector-to-vector step is the column stride, in-vector step is the
        // row stride.
        a_ld = a_cs;  a_inc = a_rs;
        b_ld = b_cs;  b_inc = b_rs;

        if ( bl1_is_lower( uplo ) )
        {
            // Vectors begin on the diagonal and lose one element per step.
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = m;
        }
        else // upper
        {
            // Vectors begin at the matrix edge and gain one element per
            // step, up to len_cap.
            shrinking = FALSE;
            n_vecs    = n;
            len_cap   = min_mn;
        }
    }
    else // row storage
    {
        // Vector-to-vector step is the row stride, in-vector step is the
        // column stride.
        a_ld = a_rs;  a_inc = a_cs;
        b_ld = b_rs;  b_inc = b_cs;

        if ( bl1_is_lower( uplo ) )
        {
            shrinking = FALSE;
            n_vecs    = m;
            len_cap   = min_mn;
        }
        else // upper
        {
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = n;
        }
    }

    // A transposed A is traversed with its two strides exchanged.
    if ( bl1_does_trans( trans ) )
    {
        bl1_swap_ints( a_ld, a_inc );
    }

    // Only the conjugation part of trans is forwarded to the vector kernel.
    conj = bl1_proj_trans1_to_conj( trans );

    for ( k = 0; k < n_vecs; ++k )
    {
        if ( shrinking )
        {
            // Start at the k-th diagonal element; k elements fewer than the
            // first vector.
            len   = len_cap - k;
            a_vec = a + k*a_ld + k*a_inc;
            b_vec = b + k*b_ld + k*b_inc;
        }
        else
        {
            // Start at the beginning of the k-th vector; k+1 elements unless
            // capped.
            len   = bl1_min( k + 1, len_cap );
            a_vec = a + k*a_ld;
            b_vec = b + k*b_ld;
        }

        bl1_saxpyv( conj,
                    len,
                    alpha,
                    a_vec, a_inc,
                    b_vec, b_inc );
    }
}
void bl1_zaxpymrt( uplo1_t uplo, trans1_t trans, int m, int n, dcomplex* alpha, dcomplex* a, int a_rs, int a_cs, dcomplex* b, int b_rs, int b_cs )
References bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), bl1_zaxpyv(), and bl1_zero_dim2().
Referenced by bl1_zher2k(), bl1_zherk(), and FLA_Axpyrt_external().
{
    // Walks the uplo-selected triangular (or trapezoidal) part of the m x n
    // operand b one vector at a time and hands each vector, together with
    // the matching vector of a, to bl1_zaxpyv() along with alpha and the
    // conj value derived from trans.
    // NOTE(review): presumably the net effect is B := B + alpha * op(A) on
    // that triangle; this depends on bl1_zaxpyv(), which is not shown here.
    dcomplex* a_vec;
    dcomplex* b_vec;
    conj1_t   conj;
    int       a_ld, a_inc;
    int       b_ld, b_inc;
    int       min_mn;
    int       n_vecs;
    int       len_cap;
    int       len;
    int       shrinking;
    int       k;

    // Early exit, as decided by bl1_zero_dim2( m, n ).
    if ( bl1_zero_dim2( m, n ) ) return;

    min_mn = bl1_min( m, n );

    // The storage format of B fixes which strides act as "leading dimension"
    // (step between vectors) and "increment" (step within a vector); uplo
    // then fixes how many vectors there are and how their lengths evolve.
    if ( bl1_is_col_storage( b_rs, b_cs ) )
    {
        // Vector-to-vector step is the column stride, in-vector step is the
        // row stride.
        a_ld = a_cs;  a_inc = a_rs;
        b_ld = b_cs;  b_inc = b_rs;

        if ( bl1_is_lower( uplo ) )
        {
            // Vectors begin on the diagonal and lose one element per step.
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = m;
        }
        else // upper
        {
            // Vectors begin at the matrix edge and gain one element per
            // step, up to len_cap.
            shrinking = FALSE;
            n_vecs    = n;
            len_cap   = min_mn;
        }
    }
    else // row storage
    {
        // Vector-to-vector step is the row stride, in-vector step is the
        // column stride.
        a_ld = a_rs;  a_inc = a_cs;
        b_ld = b_rs;  b_inc = b_cs;

        if ( bl1_is_lower( uplo ) )
        {
            shrinking = FALSE;
            n_vecs    = m;
            len_cap   = min_mn;
        }
        else // upper
        {
            shrinking = TRUE;
            n_vecs    = min_mn;
            len_cap   = n;
        }
    }

    // A transposed A is traversed with its two strides exchanged.
    if ( bl1_does_trans( trans ) )
    {
        bl1_swap_ints( a_ld, a_inc );
    }

    // Only the conjugation part of trans is forwarded to the vector kernel.
    conj = bl1_proj_trans1_to_conj( trans );

    for ( k = 0; k < n_vecs; ++k )
    {
        if ( shrinking )
        {
            // Start at the k-th diagonal element; k elements fewer than the
            // first vector.
            len   = len_cap - k;
            a_vec = a + k*a_ld + k*a_inc;
            b_vec = b + k*b_ld + k*b_inc;
        }
        else
        {
            // Start at the beginning of the k-th vector; k+1 elements unless
            // capped.
            len   = bl1_min( k + 1, len_cap );
            a_vec = a + k*a_ld;
            b_vec = b + k*b_ld;
        }

        bl1_zaxpyv( conj,
                    len,
                    alpha,
                    a_vec, a_inc,
                    b_vec, b_inc );
    }
}
1.7.6.1