libflame revision_anchor
Functions
FLA_Symm_external_gpu.c File Reference

(r)

Functions

FLA_Error FLA_Symm_external_gpu (FLA_Side side, FLA_Uplo uplo, FLA_Obj alpha, FLA_Obj A, void *A_gpu, FLA_Obj B, void *B_gpu, FLA_Obj beta, FLA_Obj C, void *C_gpu)
 

Function Documentation

◆ FLA_Symm_external_gpu()

FLA_Error FLA_Symm_external_gpu ( FLA_Side  side,
FLA_Uplo  uplo,
FLA_Obj  alpha,
FLA_Obj  A,
void A_gpu,
FLA_Obj  B,
void B_gpu,
FLA_Obj  beta,
FLA_Obj  C,
void C_gpu 
)
18{
19 FLA_Datatype datatype;
20 int m_C, n_C;
21 int ldim_A;
22 int ldim_B;
23 int ldim_C;
24 char blas_side;
25 char blas_uplo;
26
28 FLA_Symm_check( side, uplo, alpha, A, B, beta, C );
29
30 if ( FLA_Obj_has_zero_dim( C ) ) return FLA_SUCCESS;
31
32 datatype = FLA_Obj_datatype( A );
33
35
37
38 m_C = FLA_Obj_length( C );
39 n_C = FLA_Obj_width( C );
41
44
45
46 switch( datatype ){
47
48 case FLA_FLOAT:
49 {
50 float *buff_alpha = ( float * ) FLA_FLOAT_PTR( alpha );
51 float *buff_beta = ( float * ) FLA_FLOAT_PTR( beta );
52
55 m_C,
56 n_C,
58 ( float * ) A_gpu, ldim_A,
59 ( float * ) B_gpu, ldim_B,
60 *buff_beta,
61 ( float * ) C_gpu, ldim_C );
62
63 break;
64 }
65
66 case FLA_DOUBLE:
67 {
68 double *buff_alpha = ( double * ) FLA_DOUBLE_PTR( alpha );
69 double *buff_beta = ( double * ) FLA_DOUBLE_PTR( beta );
70
73 m_C,
74 n_C,
76 ( double * ) A_gpu, ldim_A,
77 ( double * ) B_gpu, ldim_B,
78 *buff_beta,
79 ( double * ) C_gpu, ldim_C );
80
81 break;
82 }
83
84 case FLA_COMPLEX:
85 {
88
91 m_C,
92 n_C,
94 ( cuComplex * ) A_gpu, ldim_A,
95 ( cuComplex * ) B_gpu, ldim_B,
96 *buff_beta,
97 ( cuComplex * ) C_gpu, ldim_C );
98
99 break;
100 }
101
103 {
106
108 blas_uplo,
109 m_C,
110 n_C,
111 *buff_alpha,
114 *buff_beta,
116
117 break;
118 }
119
120 }
121
122 return FLA_SUCCESS;
123}
FLA_Error FLA_Symm_check(FLA_Side side, FLA_Uplo uplo, FLA_Obj alpha, FLA_Obj A, FLA_Obj B, FLA_Obj beta, FLA_Obj C)
Definition FLA_Symm_check.c:13
dim_t FLA_Obj_width(FLA_Obj obj)
Definition FLA_Query.c:123
FLA_Bool FLA_Obj_has_zero_dim(FLA_Obj A)
Definition FLA_Query.c:400
dim_t FLA_Obj_length(FLA_Obj obj)
Definition FLA_Query.c:116
unsigned int FLA_Check_error_level(void)
Definition FLA_Check.c:18
void FLA_Param_map_flame_to_netlib_side(FLA_Uplo side, void *blas_side)
Definition FLA_Param.c:71
void FLA_Param_map_flame_to_netlib_uplo(FLA_Uplo uplo, void *blas_uplo)
Definition FLA_Param.c:47
FLA_Datatype FLA_Obj_datatype(FLA_Obj obj)
Definition FLA_Query.c:13
int FLA_Datatype
Definition FLA_type_defs.h:49
int i
Definition bl1_axmyv2.c:145

References FLA_Check_error_level(), FLA_Obj_datatype(), FLA_Obj_has_zero_dim(), FLA_Obj_length(), FLA_Obj_width(), FLA_Param_map_flame_to_netlib_side(), FLA_Param_map_flame_to_netlib_uplo(), FLA_Symm_check(), and i.

Referenced by FLASH_Queue_exec_task_gpu().