| 
    libflame
    12600
    
   
   | 
  
  
  
 
Functions | |
| FLA_Error | FLA_Trsv_external_gpu (FLA_Uplo uplo, FLA_Trans trans, FLA_Diag diag, FLA_Obj A, void *A_gpu, FLA_Obj x, void *x_gpu) | 
FLA_Error FLA_Trsv_external_gpu( FLA_Uplo uplo, FLA_Trans trans, FLA_Diag diag, FLA_Obj A, void *A_gpu, FLA_Obj x, void *x_gpu )
References FLA_Check_error_level(), FLA_Obj_datatype(), FLA_Obj_has_zero_dim(), FLA_Obj_length(), FLA_Param_map_flame_to_netlib_diag(), FLA_Param_map_flame_to_netlib_trans(), FLA_Param_map_flame_to_netlib_uplo(), and FLA_Trsv_check().
Referenced by FLASH_Queue_exec_task_gpu().
{
  /*
   * Triangular solve with a single vector, forwarded to the cuBLAS trsv
   * routine that matches the datatype of A.
   *
   * uplo, trans, diag - FLAME parameters; each is translated to the
   *                     character code that is handed to cuBLAS.
   * A                 - supplies the datatype, the problem size and the
   *                     leading dimension.
   * x                 - only consulted by the optional parameter check.
   * A_gpu, x_gpu      - pointers handed to cuBLAS after a cast to the
   *                     element type selected by A's datatype (presumably
   *                     the device-side copies of A and x -- confirm
   *                     against the caller).
   *
   * Always returns FLA_SUCCESS; no cuBLAS status is examined here.
   */
  FLA_Datatype dt;
  int          order;
  int          lda;
  int          x_stride = 1;   /* x is always walked with unit stride */
  char         uplo_ch;
  char         trans_ch;
  char         diag_ch;

  /* Argument validation runs only at the full error-checking level. */
  if ( FLA_Check_error_level() == FLA_FULL_ERROR_CHECKING )
  {
    FLA_Trsv_check( uplo, trans, diag, A, x );
  }

  /* Nothing to solve when A has a zero dimension. */
  if ( FLA_Obj_has_zero_dim( A ) )
  {
    return FLA_SUCCESS;
  }

  dt    = FLA_Obj_datatype( A );
  order = FLA_Obj_length( A );

  /* The leading dimension is also taken from the object length rather
     than from a stride query -- presumably because the GPU copy of A is
     stored contiguously; TODO confirm. */
  lda   = FLA_Obj_length( A );

  /* Translate the FLAME parameters into the characters cuBLAS expects. */
  FLA_Param_map_flame_to_netlib_uplo( uplo, &uplo_ch );
  FLA_Param_map_flame_to_netlib_trans( trans, &trans_ch );
  FLA_Param_map_flame_to_netlib_diag( diag, &diag_ch );

  /* Pick the cuBLAS entry point by element type.  A datatype that matches
     none of the four branches results in no call at all. */
  if ( dt == FLA_FLOAT )
  {
    cublasStrsv( uplo_ch, trans_ch, diag_ch, order,
                 ( float * ) A_gpu, lda,
                 ( float * ) x_gpu, x_stride );
  }
  else if ( dt == FLA_DOUBLE )
  {
    cublasDtrsv( uplo_ch, trans_ch, diag_ch, order,
                 ( double * ) A_gpu, lda,
                 ( double * ) x_gpu, x_stride );
  }
  else if ( dt == FLA_COMPLEX )
  {
    cublasCtrsv( uplo_ch, trans_ch, diag_ch, order,
                 ( cuComplex * ) A_gpu, lda,
                 ( cuComplex * ) x_gpu, x_stride );
  }
  else if ( dt == FLA_DOUBLE_COMPLEX )
  {
    cublasZtrsv( uplo_ch, trans_ch, diag_ch, order,
                 ( cuDoubleComplex * ) A_gpu, lda,
                 ( cuDoubleComplex * ) x_gpu, x_stride );
  }

  return FLA_SUCCESS;
}
 1.7.6.1