|
1 | 1 | #pragma OPENCL EXTENSION cl_khr_fp16 : enable
|
2 | 2 |
|
3 | 3 | // CHECK-LABEL: test_fract_f16
|
4 |
| -// GFX600: v_cvt_f32_f16 |
5 |
| -// GFX600-DAG: v_floor_f32 |
6 |
| -// GFX600-DAG: v_sub_f32 |
7 |
| -// GFX600-DAG: v_min_f32_e32 v{{[0-9]+}}, 0x3f7fe000, |
8 |
| -// GFX600-DAG: v_cmp_u_f32 |
9 |
| -// GFX600-DAG: v_cmp_neq_f32 |
10 |
| -// GFX600-DAG: v_cndmask_b32 |
11 |
| -// GFX600-DAG: v_cvt_f16_f32 |
12 |
| -// GFX600-DAG: v_cvt_f16_f32 |
| 4 | +// GFX600-DAG: s_add_u32 |
| 5 | +// GFX600-DAG: s_addc_u32 |
| 6 | +// GFX600: buffer_load_ushort |
| 7 | +// GFX600-DAG: v_lshlrev_b32 |
| 8 | +// GFX600-DAG: v_mov_b32 |
| 9 | +// GFX600-DAG: s_mov_b32 |
| 10 | +// GFX600-DAG: s_mov_b32 |
| 11 | +// GFX600: s_waitcnt |
| 12 | +// GFX600: buffer_store_short |
13 | 13 |
|
14 | 14 |
|
15 | 15 | // TODO: Could promote the f16 pattern to f32
|
16 |
| -// GFX700: flat_load_ushort [[VAL:v[0-9]+]] |
17 |
| -// GFX700: v_cvt_f32_f16_e32 [[VAL_F32:v[0-9]+]] |
18 |
| -// GFX700-DAG: v_floor_f32_e32 [[FLOOR:v[0-9]+]], [[VAL_F32]] |
19 |
| -// GFX700: v_sub_f32_e32 [[SUB:v[0-9]+]], [[VAL_F32]], [[FLOOR]] |
20 |
| - |
21 |
| -// GFX700-DAG: v_min_f32_e32 [[CLAMP:v[0-9]+]], 0x3f7fe000, [[SUB]] |
22 |
| -// GFX700-DAG: v_cmp_u_f32 |
23 |
| -// GFX700-DAG: v_cmp_neq_f32 |
24 |
| -// GFX700-DAG: v_cndmask_b32 |
25 |
| -// GFX700-DAG: v_cvt_f16_f32 |
26 |
| -// GFX700-DAG: v_cvt_f16_f32 |
| 16 | +// GFX700-DAG: s_add_i32 |
| 17 | +// GFX700-DAG: s_lshr_b32 |
| 18 | +// GFX700-DAG: s_add_u32 |
| 19 | +// GFX700-DAG: s_addc_u32 |
| 20 | +// GFX700: buffer_load_ushort |
| 21 | +// GFX700-DAG: s_load_dwordx2 |
| 22 | +// GFX700-DAG: v_lshlrev_b32 |
| 23 | +// GFX700-DAG: s_mov_b32 |
| 24 | +// GFX700-DAG: s_waitcnt |
| 25 | +// GFX700-DAG: v_mov_b32 |
| 26 | +// GFX700-DAG: v_add_i32 |
| 27 | +// GFX700-DAG: v_addc_u32 |
| 28 | +// GFX700: s_waitcnt |
| 29 | +// GFX700: flat_store_short |
| 30 | + |
27 | 31 |
|
28 | 32 | // GFX803: flat_load_ushort [[VAL:v[0-9]+]]
|
29 | 33 | // GFX803-DAG: v_floor_f16_e32 [[FLOOR:v[0-9]+]], [[VAL]]
|
|
0 commit comments