libflame revision_anchor
Functions
FLA_CAQR2_UT_opt_var1.c File Reference

(r)

Functions

FLA_Error FLA_CAQR2_UT_opt_var1 (FLA_Obj U, FLA_Obj D, FLA_Obj T)
 
FLA_Error FLA_CAQR2_UT_ops_var1 (int mn_UT, int m_D, float *buff_U, int rs_U, int cs_U, float *buff_D, int rs_D, int cs_D, float *buff_T, int rs_T, int cs_T)
 
FLA_Error FLA_CAQR2_UT_opd_var1 (int mn_UT, int m_D, double *buff_U, int rs_U, int cs_U, double *buff_D, int rs_D, int cs_D, double *buff_T, int rs_T, int cs_T)
 
FLA_Error FLA_CAQR2_UT_opc_var1 (int mn_UT, int m_D, scomplex *buff_U, int rs_U, int cs_U, scomplex *buff_D, int rs_D, int cs_D, scomplex *buff_T, int rs_T, int cs_T)
 
FLA_Error FLA_CAQR2_UT_opz_var1 (int mn_UT, int m_D, dcomplex *buff_U, int rs_U, int cs_U, dcomplex *buff_D, int rs_D, int cs_D, dcomplex *buff_T, int rs_T, int cs_T)
 

Function Documentation

◆ FLA_CAQR2_UT_opc_var1()

FLA_Error FLA_CAQR2_UT_opc_var1 ( int  mn_UT,
int  m_D,
scomplex * buff_U,
int  rs_U,
int  cs_U,
scomplex * buff_D,
int  rs_D,
int  cs_D,
scomplex * buff_T,
int  rs_T,
int  cs_T 
)
270{
271 scomplex* buff_1 = FLA_COMPLEX_PTR( FLA_ONE );
272 int i, j;
273 int m_DT = m_D - mn_UT;
274
275 for ( i = m_DT, j = 0; j < mn_UT; ++i, ++j )
276 {
277 scomplex* upsilon11 = buff_U + (j )*cs_U + (j )*rs_U;
278 scomplex* u12t = buff_U + (j+1)*cs_U + (j )*rs_U;
279
280 scomplex* D00 = buff_D + (0 )*cs_D + (0 )*rs_D;
281 scomplex* d1 = buff_D + (j )*cs_D + (0 )*rs_D;
282 scomplex* D2 = buff_D + (j+1)*cs_D + (0 )*rs_D;
283
284 scomplex* tau11 = buff_T + (j )*cs_T + (j )*rs_T;
285 scomplex* t01 = buff_T + (j )*cs_T + (0 )*rs_T;
286
287 scomplex* d1B = d1 + (m_DT)*rs_D;
288 scomplex* D00B = D00 + (m_DT)*rs_D;
289
290 int m_behind = i;
291 int n_behind = j;
292 int mn_ahead = mn_UT - j - 1;
293
294 //------------------------------------------------------------//
295
296 // FLA_Househ2_UT( FLA_LEFT,
297 // upsilon11,
298 // d1, tau11 );
299 FLA_Househ2_UT_l_opc( m_behind + 1,
300 upsilon11,
301 d1, rs_D,
302 tau11 );
303
304 // FLA_Apply_H2_UT( FLA_LEFT, tau11, d1, u12t,
305 // D2 );
306 FLA_Apply_H2_UT_l_opc_var1( m_behind + 1,
307 mn_ahead,
308 tau11,
309 d1, rs_D,
310 u12t, cs_U,
311 D2, rs_D, cs_D );
312
313 // FLA_Copy_external( d01B, t01 );
314 // FLA_Trmv_external( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
315 // D00B, t01 );
316 // FLA_Gemv_external( FLA_CONJ_TRANSPOSE, FLA_ONE, D00T, d01T, FLA_ONE, t01 );
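317 bl1_ccopyv( BLIS1_NO_CONJUGATE,
318 n_behind,
319 d1B, rs_D,
320 t01, rs_T );
321 bl1_ctrmv( BLIS1_UPPER_TRIANGULAR,
322 BLIS1_CONJ_TRANSPOSE,
323 BLIS1_NONUNIT_DIAG,
324 n_behind,
325 D00B, rs_D, cs_D,
326 t01, rs_T );
327 bl1_cgemv( BLIS1_CONJ_TRANSPOSE,
328 BLIS1_NO_CONJUGATE,
329 m_DT,
330 n_behind,
331 buff_1,
332 D00, rs_D, cs_D,
333 d1, rs_D,
334 buff_1,
335 t01, rs_T );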
336
337 //------------------------------------------------------------//
338
339 }
340
341 return FLA_SUCCESS;
342}
FLA_Error FLA_Apply_H2_UT_l_opc_var1(int m_u2_A2, int n_a1t, scomplex *tau, scomplex *u2, int inc_u2, scomplex *a1t, int inc_a1t, scomplex *A2, int rs_A2, int cs_A2)
Definition FLA_Apply_H2_UT_l_opt_var1.c:269
FLA_Obj FLA_ONE
Definition FLA_Init.c:18
FLA_Error FLA_Househ2_UT_l_opc(int m_x2, scomplex *chi_1, scomplex *x2, int inc_x2, scomplex *tau)
Definition FLA_Househ2_UT.c:390
int i
Definition bl1_axmyv2.c:145
void bl1_ccopyv(conj1_t conj, int m, scomplex *x, int incx, scomplex *y, int incy)
Definition bl1_copyv.c:49
void bl1_cgemv(trans1_t transa, conj1_t conjx, int m, int n, scomplex *alpha, scomplex *a, int a_rs, int a_cs, scomplex *x, int incx, scomplex *beta, scomplex *y, int incy)
Definition bl1_gemv.c:125
void bl1_ctrmv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, scomplex *a, int a_rs, int a_cs, scomplex *x, int incx)
Definition bl1_trmv.c:99
@ BLIS1_UPPER_TRIANGULAR
Definition blis_type_defs.h:63
@ BLIS1_NONUNIT_DIAG
Definition blis_type_defs.h:74
@ BLIS1_CONJ_TRANSPOSE
Definition blis_type_defs.h:57
@ BLIS1_NO_CONJUGATE
Definition blis_type_defs.h:81
Definition blis_type_defs.h:133

References bl1_ccopyv(), bl1_cgemv(), bl1_ctrmv(), BLIS1_CONJ_TRANSPOSE, BLIS1_NO_CONJUGATE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_Apply_H2_UT_l_opc_var1(), FLA_Househ2_UT_l_opc(), FLA_ONE, and i.

Referenced by FLA_CAQR2_UT_opt_var1().

◆ FLA_CAQR2_UT_opd_var1()

FLA_Error FLA_CAQR2_UT_opd_var1 ( int  mn_UT,
int  m_D,
double * buff_U,
int  rs_U,
int  cs_U,
double * buff_D,
int  rs_D,
int  cs_D,
double * buff_T,
int  rs_T,
int  cs_T 
)
189{
190 double* buff_1 = FLA_DOUBLE_PTR( FLA_ONE );
191 int i, j;
192 int m_DT = m_D - mn_UT;
193
194 for ( i = m_DT, j = 0; j < mn_UT; ++i, ++j )
195 {
196 double* upsilon11 = buff_U + (j )*cs_U + (j )*rs_U;
197 double* u12t = buff_U + (j+1)*cs_U + (j )*rs_U;
198
199 double* D00 = buff_D + (0 )*cs_D + (0 )*rs_D;
200 double* d1 = buff_D + (j )*cs_D + (0 )*rs_D;
201 double* D2 = buff_D + (j+1)*cs_D + (0 )*rs_D;
202
203 double* tau11 = buff_T + (j )*cs_T + (j )*rs_T;
204 double* t01 = buff_T + (j )*cs_T + (0 )*rs_T;
205
206 double* d1B = d1 + (m_DT)*rs_D;
207 double* D00B = D00 + (m_DT)*rs_D;
208
209 int m_behind = i;
210 int n_behind = j;
211 int mn_ahead = mn_UT - j - 1;
212
213 //------------------------------------------------------------//
214
215 // FLA_Househ2_UT( FLA_LEFT,
216 // upsilon11,
217 // d1, tau11 );
218 FLA_Househ2_UT_l_opd( m_behind + 1,
219 upsilon11,
220 d1, rs_D,
221 tau11 );
222
223 // FLA_Apply_H2_UT( FLA_LEFT, tau11, d1, u12t,
224 // D2 );
225 FLA_Apply_H2_UT_l_opd_var1( m_behind + 1,
226 mn_ahead,
227 tau11,
228 d1, rs_D,
229 u12t, cs_U,
230 D2, rs_D, cs_D );
231
232 // FLA_Copy_external( d01B, t01 );
233 // FLA_Trmv_external( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
234 // D00B, t01 );
235 // FLA_Gemv_external( FLA_CONJ_TRANSPOSE, FLA_ONE, D00T, d01T, FLA_ONE, t01 );
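236 bl1_dcopyv( BLIS1_NO_CONJUGATE,
237 n_behind,
238 d1B, rs_D,
239 t01, rs_T );
240 bl1_dtrmv( BLIS1_UPPER_TRIANGULAR,
241 BLIS1_CONJ_TRANSPOSE,
242 BLIS1_NONUNIT_DIAG,
243 n_behind,
244 D00B, rs_D, cs_D,
245 t01, rs_T );
246 bl1_dgemv( BLIS1_CONJ_TRANSPOSE,
247 BLIS1_NO_CONJUGATE,
248 m_DT,
249 n_behind,
250 buff_1,
251 D00, rs_D, cs_D,
252 d1, rs_D,
253 buff_1,
254 t01, rs_T );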
255
256 //------------------------------------------------------------//
257
258 }
259
260 return FLA_SUCCESS;
261}
FLA_Error FLA_Apply_H2_UT_l_opd_var1(int m_u2_A2, int n_a1t, double *tau, double *u2, int inc_u2, double *a1t, int inc_a1t, double *A2, int rs_A2, int cs_A2)
Definition FLA_Apply_H2_UT_l_opt_var1.c:195
FLA_Error FLA_Househ2_UT_l_opd(int m_x2, double *chi_1, double *x2, int inc_x2, double *tau)
Definition FLA_Househ2_UT.c:274
void bl1_dcopyv(conj1_t conj, int m, double *x, int incx, double *y, int incy)
Definition bl1_copyv.c:42
void bl1_dgemv(trans1_t transa, conj1_t conjx, int m, int n, double *alpha, double *a, int a_rs, int a_cs, double *x, int incx, double *beta, double *y, int incy)
Definition bl1_gemv.c:69
void bl1_dtrmv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, double *a, int a_rs, int a_cs, double *x, int incx)
Definition bl1_trmv.c:56

References bl1_dcopyv(), bl1_dgemv(), bl1_dtrmv(), BLIS1_CONJ_TRANSPOSE, BLIS1_NO_CONJUGATE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_Apply_H2_UT_l_opd_var1(), FLA_Househ2_UT_l_opd(), FLA_ONE, and i.

Referenced by FLA_CAQR2_UT_opt_var1().

◆ FLA_CAQR2_UT_ops_var1()

FLA_Error FLA_CAQR2_UT_ops_var1 ( int  mn_UT,
int  m_D,
float * buff_U,
int  rs_U,
int  cs_U,
float * buff_D,
int  rs_D,
int  cs_D,
float * buff_T,
int  rs_T,
int  cs_T 
)
108{
109 float* buff_1 = FLA_FLOAT_PTR( FLA_ONE );
110 int i, j;
111 int m_DT = m_D - mn_UT;
112
113 for ( i = m_DT, j = 0; j < mn_UT; ++i, ++j )
114 {
115 float* upsilon11 = buff_U + (j )*cs_U + (j )*rs_U;
116 float* u12t = buff_U + (j+1)*cs_U + (j )*rs_U;
117
118 float* D00 = buff_D + (0 )*cs_D + (0 )*rs_D;
119 float* d1 = buff_D + (j )*cs_D + (0 )*rs_D;
120 float* D2 = buff_D + (j+1)*cs_D + (0 )*rs_D;
121
122 float* tau11 = buff_T + (j )*cs_T + (j )*rs_T;
123 float* t01 = buff_T + (j )*cs_T + (0 )*rs_T;
124
125 float* d1B = d1 + (m_DT)*rs_D;
126 float* D00B = D00 + (m_DT)*rs_D;
127
128 int m_behind = i;
129 int n_behind = j;
130 int mn_ahead = mn_UT - j - 1;
131
132 //------------------------------------------------------------//
133
134 // FLA_Househ2_UT( FLA_LEFT,
135 // upsilon11,
136 // d1, tau11 );
137 FLA_Househ2_UT_l_ops( m_behind + 1,
138 upsilon11,
139 d1, rs_D,
140 tau11 );
141
142 // FLA_Apply_H2_UT( FLA_LEFT, tau11, d1, u12t,
143 // D2 );
144 FLA_Apply_H2_UT_l_ops_var1( m_behind + 1,
145 mn_ahead,
146 tau11,
147 d1, rs_D,
148 u12t, cs_U,
149 D2, rs_D, cs_D );
150
151 // FLA_Copy_external( d01B, t01 );
152 // FLA_Trmv_external( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
153 // D00B, t01 );
154 // FLA_Gemv_external( FLA_CONJ_TRANSPOSE, FLA_ONE, D00T, d01T, FLA_ONE, t01 );
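155 bl1_scopyv( BLIS1_NO_CONJUGATE,
156 n_behind,
157 d1B, rs_D,
158 t01, rs_T );
159 bl1_strmv( BLIS1_UPPER_TRIANGULAR,
160 BLIS1_CONJ_TRANSPOSE,
161 BLIS1_NONUNIT_DIAG,
162 n_behind,
163 D00B, rs_D, cs_D,
164 t01, rs_T );
165 bl1_sgemv( BLIS1_CONJ_TRANSPOSE,
166 BLIS1_NO_CONJUGATE,
167 m_DT,
168 n_behind,
169 buff_1,
170 D00, rs_D, cs_D,
171 d1, rs_D,
172 buff_1,
173 t01, rs_T );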
174
175 //------------------------------------------------------------//
176
177 }
178
179 return FLA_SUCCESS;
180}
FLA_Error FLA_Apply_H2_UT_l_ops_var1(int m_u2_A2, int n_a1t, float *tau, float *u2, int inc_u2, float *a1t, int inc_a1t, float *A2, int rs_A2, int cs_A2)
Definition FLA_Apply_H2_UT_l_opt_var1.c:121
FLA_Error FLA_Househ2_UT_l_ops(int m_x2, float *chi_1, float *x2, int inc_x2, float *tau)
Definition FLA_Househ2_UT.c:160
void bl1_scopyv(conj1_t conj, int m, float *x, int incx, float *y, int incy)
Definition bl1_copyv.c:35
void bl1_sgemv(trans1_t transa, conj1_t conjx, int m, int n, float *alpha, float *a, int a_rs, int a_cs, float *x, int incx, float *beta, float *y, int incy)
Definition bl1_gemv.c:13
void bl1_strmv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, float *a, int a_rs, int a_cs, float *x, int incx)
Definition bl1_trmv.c:13

References bl1_scopyv(), bl1_sgemv(), bl1_strmv(), BLIS1_CONJ_TRANSPOSE, BLIS1_NO_CONJUGATE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_Apply_H2_UT_l_ops_var1(), FLA_Househ2_UT_l_ops(), FLA_ONE, and i.

Referenced by FLA_CAQR2_UT_opt_var1().

◆ FLA_CAQR2_UT_opt_var1()

FLA_Error FLA_CAQR2_UT_opt_var1 ( FLA_Obj  U,
FLA_Obj  D,
FLA_Obj  T 
)
15{
16 FLA_Datatype datatype;
17 int mn_UT, m_D;
18 int rs_U, cs_U;
19 int rs_D, cs_D;
20 int rs_T, cs_T;
21
22 datatype = FLA_Obj_datatype( U );
23
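24 mn_UT = FLA_Obj_width( U );
25 m_D = FLA_Obj_length( D );
26
27 rs_U = FLA_Obj_row_stride( U );
28 cs_U = FLA_Obj_col_stride( U );
29 rs_D = FLA_Obj_row_stride( D );
30 cs_D = FLA_Obj_col_stride( D );
31 rs_T = FLA_Obj_row_stride( T );
32 cs_T = FLA_Obj_col_stride( T );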
33
34
35 switch ( datatype )
36 {
37 case FLA_FLOAT:
38 {
39 float* buff_U = FLA_FLOAT_PTR( U );
40 float* buff_D = FLA_FLOAT_PTR( D );
41 float* buff_T = FLA_FLOAT_PTR( T );
42
43 FLA_CAQR2_UT_ops_var1( mn_UT,
44 m_D,
45 buff_U, rs_U, cs_U,
46 buff_D, rs_D, cs_D,
47 buff_T, rs_T, cs_T );
48
49 break;
50 }
51
52 case FLA_DOUBLE:
53 {
54 double* buff_U = FLA_DOUBLE_PTR( U );
55 double* buff_D = FLA_DOUBLE_PTR( D );
56 double* buff_T = FLA_DOUBLE_PTR( T );
57
58 FLA_CAQR2_UT_opd_var1( mn_UT,
59 m_D,
60 buff_U, rs_U, cs_U,
61 buff_D, rs_D, cs_D,
62 buff_T, rs_T, cs_T );
63
64 break;
65 }
66
67 case FLA_COMPLEX:
68 {
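69 scomplex* buff_U = FLA_COMPLEX_PTR( U );
70 scomplex* buff_D = FLA_COMPLEX_PTR( D );
71 scomplex* buff_T = FLA_COMPLEX_PTR( T );
72
73 FLA_CAQR2_UT_opc_var1( mn_UT,
74 m_D,
75 buff_U, rs_U, cs_U,
76 buff_D, rs_D, cs_D,
77 buff_T, rs_T, cs_T );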
78
79 break;
80 }
81
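82 case FLA_DOUBLE_COMPLEX:
83 {
84 dcomplex* buff_U = FLA_DOUBLE_COMPLEX_PTR( U );
85 dcomplex* buff_D = FLA_DOUBLE_COMPLEX_PTR( D );
86 dcomplex* buff_T = FLA_DOUBLE_COMPLEX_PTR( T );
87
88 FLA_CAQR2_UT_opz_var1( mn_UT,
89 m_D,
90 buff_U, rs_U, cs_U,
91 buff_D, rs_D, cs_D,
92 buff_T, rs_T, cs_T );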
93
94 break;
95 }
96 }
97
98 return FLA_SUCCESS;
99}
FLA_Error FLA_CAQR2_UT_opd_var1(int mn_UT, int m_D, double *buff_U, int rs_U, int cs_U, double *buff_D, int rs_D, int cs_D, double *buff_T, int rs_T, int cs_T)
Definition FLA_CAQR2_UT_opt_var1.c:184
FLA_Error FLA_CAQR2_UT_opz_var1(int mn_UT, int m_D, dcomplex *buff_U, int rs_U, int cs_U, dcomplex *buff_D, int rs_D, int cs_D, dcomplex *buff_T, int rs_T, int cs_T)
Definition FLA_CAQR2_UT_opt_var1.c:346
FLA_Error FLA_CAQR2_UT_opc_var1(int mn_UT, int m_D, scomplex *buff_U, int rs_U, int cs_U, scomplex *buff_D, int rs_D, int cs_D, scomplex *buff_T, int rs_T, int cs_T)
Definition FLA_CAQR2_UT_opt_var1.c:265
FLA_Error FLA_CAQR2_UT_ops_var1(int mn_UT, int m_D, float *buff_U, int rs_U, int cs_U, float *buff_D, int rs_D, int cs_D, float *buff_T, int rs_T, int cs_T)
Definition FLA_CAQR2_UT_opt_var1.c:103
dim_t FLA_Obj_width(FLA_Obj obj)
Definition FLA_Query.c:123
dim_t FLA_Obj_row_stride(FLA_Obj obj)
Definition FLA_Query.c:167
dim_t FLA_Obj_length(FLA_Obj obj)
Definition FLA_Query.c:116
dim_t FLA_Obj_col_stride(FLA_Obj obj)
Definition FLA_Query.c:174
FLA_Datatype FLA_Obj_datatype(FLA_Obj obj)
Definition FLA_Query.c:13
int FLA_Datatype
Definition FLA_type_defs.h:49
Definition blis_type_defs.h:138

References FLA_CAQR2_UT_opc_var1(), FLA_CAQR2_UT_opd_var1(), FLA_CAQR2_UT_ops_var1(), FLA_CAQR2_UT_opz_var1(), FLA_Obj_col_stride(), FLA_Obj_datatype(), FLA_Obj_length(), FLA_Obj_row_stride(), FLA_Obj_width(), and i.

Referenced by FLA_CAQR2_UT_internal().

◆ FLA_CAQR2_UT_opz_var1()

FLA_Error FLA_CAQR2_UT_opz_var1 ( int  mn_UT,
int  m_D,
dcomplex * buff_U,
int  rs_U,
int  cs_U,
dcomplex * buff_D,
int  rs_D,
int  cs_D,
dcomplex * buff_T,
int  rs_T,
int  cs_T 
)
351{
352 dcomplex* buff_1 = FLA_DOUBLE_COMPLEX_PTR( FLA_ONE );
353 int i, j;
354 int m_DT = m_D - mn_UT;
355
356 for ( i = m_DT, j = 0; j < mn_UT; ++i, ++j )
357 {
358 dcomplex* upsilon11 = buff_U + (j )*cs_U + (j )*rs_U;
359 dcomplex* u12t = buff_U + (j+1)*cs_U + (j )*rs_U;
360
361 dcomplex* D00 = buff_D + (0 )*cs_D + (0 )*rs_D;
362 dcomplex* d1 = buff_D + (j )*cs_D + (0 )*rs_D;
363 dcomplex* D2 = buff_D + (j+1)*cs_D + (0 )*rs_D;
364
365 dcomplex* tau11 = buff_T + (j )*cs_T + (j )*rs_T;
366 dcomplex* t01 = buff_T + (j )*cs_T + (0 )*rs_T;
367
368 dcomplex* d1B = d1 + (m_DT)*rs_D;
369 dcomplex* D00B = D00 + (m_DT)*rs_D;
370
371 int m_behind = i;
372 int n_behind = j;
373 int mn_ahead = mn_UT - j - 1;
374
375 //------------------------------------------------------------//
376
377 // FLA_Househ2_UT( FLA_LEFT,
378 // upsilon11,
379 // d1, tau11 );
380 FLA_Househ2_UT_l_opz( m_behind + 1,
381 upsilon11,
382 d1, rs_D,
383 tau11 );
384
385 // FLA_Apply_H2_UT( FLA_LEFT, tau11, d1, u12t,
386 // D2 );
387 FLA_Apply_H2_UT_l_opz_var1( m_behind + 1,
388 mn_ahead,
389 tau11,
390 d1, rs_D,
391 u12t, cs_U,
392 D2, rs_D, cs_D );
393
394 // FLA_Copy_external( d01B, t01 );
395 // FLA_Trmv_external( FLA_UPPER_TRIANGULAR, FLA_CONJ_TRANSPOSE, FLA_NONUNIT_DIAG,
396 // D00B, t01 );
397 // FLA_Gemv_external( FLA_CONJ_TRANSPOSE, FLA_ONE, D00T, d01T, FLA_ONE, t01 );
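398 bl1_zcopyv( BLIS1_NO_CONJUGATE,
399 n_behind,
400 d1B, rs_D,
401 t01, rs_T );
402 bl1_ztrmv( BLIS1_UPPER_TRIANGULAR,
403 BLIS1_CONJ_TRANSPOSE,
404 BLIS1_NONUNIT_DIAG,
405 n_behind,
406 D00B, rs_D, cs_D,
407 t01, rs_T );
408 bl1_zgemv( BLIS1_CONJ_TRANSPOSE,
409 BLIS1_NO_CONJUGATE,
410 m_DT,
411 n_behind,
412 buff_1,
413 D00, rs_D, cs_D,
414 d1, rs_D,
415 buff_1,
416 t01, rs_T );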
417
418 //------------------------------------------------------------//
419
420 }
421
422 return FLA_SUCCESS;
423}
FLA_Error FLA_Apply_H2_UT_l_opz_var1(int m_u2_A2, int n_a1t, dcomplex *tau, dcomplex *u2, int inc_u2, dcomplex *a1t, int inc_a1t, dcomplex *A2, int rs_A2, int cs_A2)
Definition FLA_Apply_H2_UT_l_opt_var1.c:343
FLA_Error FLA_Househ2_UT_l_opz(int m_x2, dcomplex *chi_1, dcomplex *x2, int inc_x2, dcomplex *tau)
Definition FLA_Househ2_UT.c:521
void bl1_zcopyv(conj1_t conj, int m, dcomplex *x, int incx, dcomplex *y, int incy)
Definition bl1_copyv.c:63
void bl1_zgemv(trans1_t transa, conj1_t conjx, int m, int n, dcomplex *alpha, dcomplex *a, int a_rs, int a_cs, dcomplex *x, int incx, dcomplex *beta, dcomplex *y, int incy)
Definition bl1_gemv.c:255
void bl1_ztrmv(uplo1_t uplo, trans1_t trans, diag1_t diag, int m, dcomplex *a, int a_rs, int a_cs, dcomplex *x, int incx)
Definition bl1_trmv.c:177

References bl1_zcopyv(), bl1_zgemv(), bl1_ztrmv(), BLIS1_CONJ_TRANSPOSE, BLIS1_NO_CONJUGATE, BLIS1_NONUNIT_DIAG, BLIS1_UPPER_TRIANGULAR, FLA_Apply_H2_UT_l_opz_var1(), FLA_Househ2_UT_l_opz(), FLA_ONE, and i.

Referenced by FLA_CAQR2_UT_opt_var1().