libflame
12600
|
Functions | |
void | bl1_saxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, float *alpha, float *a, int a_rs, int a_cs, float *b, int b_rs, int b_cs) |
void | bl1_daxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, double *alpha, double *a, int a_rs, int a_cs, double *b, int b_rs, int b_cs) |
void | bl1_caxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, scomplex *alpha, scomplex *a, int a_rs, int a_cs, scomplex *b, int b_rs, int b_cs) |
void | bl1_zaxpymrt (uplo1_t uplo, trans1_t trans, int m, int n, dcomplex *alpha, dcomplex *a, int a_rs, int a_cs, dcomplex *b, int b_rs, int b_cs) |
void bl1_caxpymrt(
    uplo1_t    uplo,
    trans1_t   trans,
    int        m,
    int        n,
    scomplex * alpha,
    scomplex * a,
    int        a_rs,
    int        a_cs,
    scomplex * b,
    int        b_rs,
    int        b_cs
)
References bl1_caxpyv(), bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), and bl1_zero_dim2().
Referenced by bl1_cher2k(), bl1_cherk(), and FLA_Axpyrt_external().
{
	/*
	 * Visits one triangle (or trapezoid) of B a column or a row at a time.
	 * Each visited vector of B is passed to bl1_caxpyv() together with the
	 * corresponding vector of A, the scalar alpha and the conjugation flag
	 * extracted from trans. uplo selects the triangle; the storage format
	 * of B (b_rs, b_cs) decides whether the vectors are columns or rows.
	 */
	scomplex* a_vec;
	scomplex* b_vec;
	int       a_ld, a_inc;     // stride between vectors / within a vector of A
	int       b_ld, b_inc;     // stride between vectors / within a vector of B
	int       vec_len_dim;     // dimension a full-length vector spans
	int       vec_cnt_dim;     // dimension that counts the vectors
	int       starts_on_diag;  // nonzero: vectors begin at the diagonal and shrink
	int       num_vecs;
	int       len_limit;
	int       len;
	int       k;
	conj1_t   conj;

	// Nothing to do when either dimension is zero.
	if ( bl1_zero_dim2( m, n ) ) return;

	// The storage format of B fixes the traversal strides for both operands
	// and, combined with uplo, whether vectors shrink or grow.
	if ( bl1_is_col_storage( b_rs, b_cs ) )
	{
		a_ld = a_cs; a_inc = a_rs;
		b_ld = b_cs; b_inc = b_rs;

		vec_len_dim    = m;
		vec_cnt_dim    = n;
		starts_on_diag = bl1_is_lower( uplo ) ? 1 : 0;
	}
	else // row storage
	{
		a_ld = a_rs; a_inc = a_cs;
		b_ld = b_rs; b_inc = b_cs;

		vec_len_dim    = n;
		vec_cnt_dim    = m;
		starts_on_diag = bl1_is_lower( uplo ) ? 0 : 1;
	}

	// Shrinking vectors: one per diagonal element, the first has full length.
	// Growing vectors: one per column/row, length capped at min( m, n ).
	if ( starts_on_diag )
	{
		num_vecs  = bl1_min( m, n );
		len_limit = vec_len_dim;
	}
	else
	{
		num_vecs  = vec_cnt_dim;
		len_limit = bl1_min( m, n );
	}

	// A transposed A is walked with its two strides exchanged.
	if ( bl1_does_trans( trans ) )
	{
		bl1_swap_ints( a_ld, a_inc );
	}

	// Only the conjugation component of trans is forwarded to the kernel.
	conj = bl1_proj_trans1_to_conj( trans );

	for ( k = 0; k < num_vecs; k++ )
	{
		if ( starts_on_diag )
		{
			// Begin at the k-th diagonal element; k fewer elements remain.
			len   = len_limit - k;
			a_vec = a + k*a_ld + k*a_inc;
			b_vec = b + k*b_ld + k*b_inc;
		}
		else
		{
			// Begin at the head of the k-th vector; stop at the diagonal.
			len   = bl1_min( k + 1, len_limit );
			a_vec = a + k*a_ld;
			b_vec = b + k*b_ld;
		}

		bl1_caxpyv( conj,
		            len,
		            alpha,
		            a_vec, a_inc,
		            b_vec, b_inc );
	}
}
void bl1_daxpymrt(
    uplo1_t    uplo,
    trans1_t   trans,
    int        m,
    int        n,
    double *   alpha,
    double *   a,
    int        a_rs,
    int        a_cs,
    double *   b,
    int        b_rs,
    int        b_cs
)
References bl1_daxpyv(), bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), and bl1_zero_dim2().
Referenced by FLA_Axpyrt_external().
{
	/*
	 * Visits one triangle (or trapezoid) of B a column or a row at a time.
	 * Each visited vector of B is passed to bl1_daxpyv() together with the
	 * corresponding vector of A, the scalar alpha and the conjugation flag
	 * extracted from trans. uplo selects the triangle; the storage format
	 * of B (b_rs, b_cs) decides whether the vectors are columns or rows.
	 */
	double*   a_vec;
	double*   b_vec;
	int       a_ld, a_inc;     // stride between vectors / within a vector of A
	int       b_ld, b_inc;     // stride between vectors / within a vector of B
	int       vec_len_dim;     // dimension a full-length vector spans
	int       vec_cnt_dim;     // dimension that counts the vectors
	int       starts_on_diag;  // nonzero: vectors begin at the diagonal and shrink
	int       num_vecs;
	int       len_limit;
	int       len;
	int       k;
	conj1_t   conj;

	// Nothing to do when either dimension is zero.
	if ( bl1_zero_dim2( m, n ) ) return;

	// The storage format of B fixes the traversal strides for both operands
	// and, combined with uplo, whether vectors shrink or grow.
	if ( bl1_is_col_storage( b_rs, b_cs ) )
	{
		a_ld = a_cs; a_inc = a_rs;
		b_ld = b_cs; b_inc = b_rs;

		vec_len_dim    = m;
		vec_cnt_dim    = n;
		starts_on_diag = bl1_is_lower( uplo ) ? 1 : 0;
	}
	else // row storage
	{
		a_ld = a_rs; a_inc = a_cs;
		b_ld = b_rs; b_inc = b_cs;

		vec_len_dim    = n;
		vec_cnt_dim    = m;
		starts_on_diag = bl1_is_lower( uplo ) ? 0 : 1;
	}

	// Shrinking vectors: one per diagonal element, the first has full length.
	// Growing vectors: one per column/row, length capped at min( m, n ).
	if ( starts_on_diag )
	{
		num_vecs  = bl1_min( m, n );
		len_limit = vec_len_dim;
	}
	else
	{
		num_vecs  = vec_cnt_dim;
		len_limit = bl1_min( m, n );
	}

	// A transposed A is walked with its two strides exchanged.
	if ( bl1_does_trans( trans ) )
	{
		bl1_swap_ints( a_ld, a_inc );
	}

	// Only the conjugation component of trans is forwarded to the kernel.
	conj = bl1_proj_trans1_to_conj( trans );

	for ( k = 0; k < num_vecs; k++ )
	{
		if ( starts_on_diag )
		{
			// Begin at the k-th diagonal element; k fewer elements remain.
			len   = len_limit - k;
			a_vec = a + k*a_ld + k*a_inc;
			b_vec = b + k*b_ld + k*b_inc;
		}
		else
		{
			// Begin at the head of the k-th vector; stop at the diagonal.
			len   = bl1_min( k + 1, len_limit );
			a_vec = a + k*a_ld;
			b_vec = b + k*b_ld;
		}

		bl1_daxpyv( conj,
		            len,
		            alpha,
		            a_vec, a_inc,
		            b_vec, b_inc );
	}
}
void bl1_saxpymrt(
    uplo1_t    uplo,
    trans1_t   trans,
    int        m,
    int        n,
    float *    alpha,
    float *    a,
    int        a_rs,
    int        a_cs,
    float *    b,
    int        b_rs,
    int        b_cs
)
References bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), bl1_saxpyv(), and bl1_zero_dim2().
Referenced by FLA_Axpyrt_external().
{
	/*
	 * Visits one triangle (or trapezoid) of B a column or a row at a time.
	 * Each visited vector of B is passed to bl1_saxpyv() together with the
	 * corresponding vector of A, the scalar alpha and the conjugation flag
	 * extracted from trans. uplo selects the triangle; the storage format
	 * of B (b_rs, b_cs) decides whether the vectors are columns or rows.
	 */
	float*    a_vec;
	float*    b_vec;
	int       a_ld, a_inc;     // stride between vectors / within a vector of A
	int       b_ld, b_inc;     // stride between vectors / within a vector of B
	int       vec_len_dim;     // dimension a full-length vector spans
	int       vec_cnt_dim;     // dimension that counts the vectors
	int       starts_on_diag;  // nonzero: vectors begin at the diagonal and shrink
	int       num_vecs;
	int       len_limit;
	int       len;
	int       k;
	conj1_t   conj;

	// Nothing to do when either dimension is zero.
	if ( bl1_zero_dim2( m, n ) ) return;

	// The storage format of B fixes the traversal strides for both operands
	// and, combined with uplo, whether vectors shrink or grow.
	if ( bl1_is_col_storage( b_rs, b_cs ) )
	{
		a_ld = a_cs; a_inc = a_rs;
		b_ld = b_cs; b_inc = b_rs;

		vec_len_dim    = m;
		vec_cnt_dim    = n;
		starts_on_diag = bl1_is_lower( uplo ) ? 1 : 0;
	}
	else // row storage
	{
		a_ld = a_rs; a_inc = a_cs;
		b_ld = b_rs; b_inc = b_cs;

		vec_len_dim    = n;
		vec_cnt_dim    = m;
		starts_on_diag = bl1_is_lower( uplo ) ? 0 : 1;
	}

	// Shrinking vectors: one per diagonal element, the first has full length.
	// Growing vectors: one per column/row, length capped at min( m, n ).
	if ( starts_on_diag )
	{
		num_vecs  = bl1_min( m, n );
		len_limit = vec_len_dim;
	}
	else
	{
		num_vecs  = vec_cnt_dim;
		len_limit = bl1_min( m, n );
	}

	// A transposed A is walked with its two strides exchanged.
	if ( bl1_does_trans( trans ) )
	{
		bl1_swap_ints( a_ld, a_inc );
	}

	// Only the conjugation component of trans is forwarded to the kernel.
	conj = bl1_proj_trans1_to_conj( trans );

	for ( k = 0; k < num_vecs; k++ )
	{
		if ( starts_on_diag )
		{
			// Begin at the k-th diagonal element; k fewer elements remain.
			len   = len_limit - k;
			a_vec = a + k*a_ld + k*a_inc;
			b_vec = b + k*b_ld + k*b_inc;
		}
		else
		{
			// Begin at the head of the k-th vector; stop at the diagonal.
			len   = bl1_min( k + 1, len_limit );
			a_vec = a + k*a_ld;
			b_vec = b + k*b_ld;
		}

		bl1_saxpyv( conj,
		            len,
		            alpha,
		            a_vec, a_inc,
		            b_vec, b_inc );
	}
}
void bl1_zaxpymrt(
    uplo1_t    uplo,
    trans1_t   trans,
    int        m,
    int        n,
    dcomplex * alpha,
    dcomplex * a,
    int        a_rs,
    int        a_cs,
    dcomplex * b,
    int        b_rs,
    int        b_cs
)
References bl1_does_trans(), bl1_is_col_storage(), bl1_is_lower(), bl1_proj_trans1_to_conj(), bl1_zaxpyv(), and bl1_zero_dim2().
Referenced by bl1_zher2k(), bl1_zherk(), and FLA_Axpyrt_external().
{
	/*
	 * Visits one triangle (or trapezoid) of B a column or a row at a time.
	 * Each visited vector of B is passed to bl1_zaxpyv() together with the
	 * corresponding vector of A, the scalar alpha and the conjugation flag
	 * extracted from trans. uplo selects the triangle; the storage format
	 * of B (b_rs, b_cs) decides whether the vectors are columns or rows.
	 */
	dcomplex* a_vec;
	dcomplex* b_vec;
	int       a_ld, a_inc;     // stride between vectors / within a vector of A
	int       b_ld, b_inc;     // stride between vectors / within a vector of B
	int       vec_len_dim;     // dimension a full-length vector spans
	int       vec_cnt_dim;     // dimension that counts the vectors
	int       starts_on_diag;  // nonzero: vectors begin at the diagonal and shrink
	int       num_vecs;
	int       len_limit;
	int       len;
	int       k;
	conj1_t   conj;

	// Nothing to do when either dimension is zero.
	if ( bl1_zero_dim2( m, n ) ) return;

	// The storage format of B fixes the traversal strides for both operands
	// and, combined with uplo, whether vectors shrink or grow.
	if ( bl1_is_col_storage( b_rs, b_cs ) )
	{
		a_ld = a_cs; a_inc = a_rs;
		b_ld = b_cs; b_inc = b_rs;

		vec_len_dim    = m;
		vec_cnt_dim    = n;
		starts_on_diag = bl1_is_lower( uplo ) ? 1 : 0;
	}
	else // row storage
	{
		a_ld = a_rs; a_inc = a_cs;
		b_ld = b_rs; b_inc = b_cs;

		vec_len_dim    = n;
		vec_cnt_dim    = m;
		starts_on_diag = bl1_is_lower( uplo ) ? 0 : 1;
	}

	// Shrinking vectors: one per diagonal element, the first has full length.
	// Growing vectors: one per column/row, length capped at min( m, n ).
	if ( starts_on_diag )
	{
		num_vecs  = bl1_min( m, n );
		len_limit = vec_len_dim;
	}
	else
	{
		num_vecs  = vec_cnt_dim;
		len_limit = bl1_min( m, n );
	}

	// A transposed A is walked with its two strides exchanged.
	if ( bl1_does_trans( trans ) )
	{
		bl1_swap_ints( a_ld, a_inc );
	}

	// Only the conjugation component of trans is forwarded to the kernel.
	conj = bl1_proj_trans1_to_conj( trans );

	for ( k = 0; k < num_vecs; k++ )
	{
		if ( starts_on_diag )
		{
			// Begin at the k-th diagonal element; k fewer elements remain.
			len   = len_limit - k;
			a_vec = a + k*a_ld + k*a_inc;
			b_vec = b + k*b_ld + k*b_inc;
		}
		else
		{
			// Begin at the head of the k-th vector; stop at the diagonal.
			len   = bl1_min( k + 1, len_limit );
			a_vec = a + k*a_ld;
			b_vec = b + k*b_ld;
		}

		bl1_zaxpyv( conj,
		            len,
		            alpha,
		            a_vec, a_inc,
		            b_vec, b_inc );
	}
}