@@ -212,47 +212,56 @@ v_clz_i32_u32 v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
212
212
v_clz_i32_u32 v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
213
213
// GFX11: v_clz_i32_u32_dpp v255, v255 row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0x72,0xfe,0x7f,0xff,0x6f,0x05,0x30]
214
214
215
- v_cos_f16 v5, v1 quad_perm:[3 ,2 ,1 ,0 ]
216
- // GFX11: v_cos_f16_dpp v5, v1 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1b,0x00,0xff]
215
+ v_cos_f16 v5.l , v1.l quad_perm:[3 ,2 ,1 ,0 ]
216
+ // GFX11: v_cos_f16_dpp v5.l , v1.l quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1b,0x00,0xff]
217
217
218
- v_cos_f16 v5, v1 quad_perm:[0 ,1 ,2 ,3 ]
219
- // GFX11: v_cos_f16_dpp v5, v1 quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0xe4,0x00,0xff]
218
+ v_cos_f16 v5.l , v1.l quad_perm:[0 ,1 ,2 ,3 ]
219
+ // GFX11: v_cos_f16_dpp v5.l , v1.l quad_perm:[0 ,1 ,2 ,3 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0xe4,0x00,0xff]
220
220
221
- v_cos_f16 v5, v1 row_mirror
222
- // GFX11: v_cos_f16_dpp v5, v1 row_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x40,0x01,0xff]
221
+ v_cos_f16 v5.l , v1.l row_mirror
222
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x40,0x01,0xff]
223
223
224
- v_cos_f16 v5, v1 row_half_mirror
225
- // GFX11: v_cos_f16_dpp v5, v1 row_half_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x41,0x01,0xff]
224
+ v_cos_f16 v5.l , v1.l row_half_mirror
225
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_half_mirror row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x41,0x01,0xff]
226
226
227
- v_cos_f16 v5, v1 row_shl:1
228
- // GFX11: v_cos_f16_dpp v5, v1 row_shl:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x01,0x01,0xff]
227
+ v_cos_f16 v5.l , v1.l row_shl:1
228
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shl:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x01,0x01,0xff]
229
229
230
- v_cos_f16 v5, v1 row_shl:15
231
- // GFX11: v_cos_f16_dpp v5, v1 row_shl:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x0f,0x01,0xff]
230
+ v_cos_f16 v5.l , v1.l row_shl:15
231
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shl:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x0f,0x01,0xff]
232
232
233
- v_cos_f16 v5, v1 row_shr:1
234
- // GFX11: v_cos_f16_dpp v5, v1 row_shr:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x11,0x01,0xff]
233
+ v_cos_f16 v5.l , v1.l row_shr:1
234
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shr:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x11,0x01,0xff]
235
235
236
- v_cos_f16 v5, v1 row_shr:15
237
- // GFX11: v_cos_f16_dpp v5, v1 row_shr:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1f,0x01,0xff]
236
+ v_cos_f16 v5.l , v1.l row_shr:15
237
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_shr:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x1f,0x01,0xff]
238
238
239
- v_cos_f16 v5, v1 row_ror:1
240
- // GFX11: v_cos_f16_dpp v5, v1 row_ror:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x21,0x01,0xff]
239
+ v_cos_f16 v5.l , v1.l row_ror:1
240
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_ror:1 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x21,0x01,0xff]
241
241
242
- v_cos_f16 v5, v1 row_ror:15
243
- // GFX11: v_cos_f16_dpp v5, v1 row_ror:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x2f,0x01,0xff]
242
+ v_cos_f16 v5.l , v1.l row_ror:15
243
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_ror:15 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x2f,0x01,0xff]
244
244
245
- v_cos_f16 v5, v1 row_share:0 row_mask:0xf bank_mask:0xf
246
- // GFX11: v_cos_f16_dpp v5, v1 row_share:0 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x50,0x01,0xff]
245
+ v_cos_f16 v5.l , v1.l row_share:0 row_mask:0xf bank_mask:0xf
246
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_share:0 row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x50,0x01,0xff]
247
247
248
- v_cos_f16 v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1
249
- // GFX11: v_cos_f16_dpp v5, v1 row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x5f,0x01,0x01]
248
+ v_cos_f16 v5.l , v1.l row_share:15 row_mask:0x0 bank_mask:0x1
249
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x5f,0x01,0x01]
250
250
251
- v_cos_f16 v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi: 0
252
- // GFX11: v_cos_f16_dpp v5, v1 row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x60,0x09,0x13]
251
+ v_cos_f16 v5.l , v1.l row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1
252
+ // GFX11: v_cos_f16_dpp v5.l , v1.l row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0xc2,0x0a,0x7e,0x01,0x60,0x09,0x13]
253
253
254
- v_cos_f16 v127, -|v127| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
255
- // GFX11: v_cos_f16_dpp v127, -|v127| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xc2,0xfe,0x7e,0x7f,0x6f,0x35,0x30]
254
+ v_cos_f16 v127.l, -|v127.l| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1
255
+ // GFX11: v_cos_f16_dpp v127.l, -|v127.l| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xc2,0xfe,0x7e,0x7f,0x6f,0x35,0x30]
256
+
257
+ v_cos_f16 v127.l, v127.l row_share:15 row_mask:0x0 bank_mask:0x1
258
+ // GFX11: v_cos_f16_dpp v127.l, v127.l row_share:15 row_mask:0x0 bank_mask:0x1 ; encoding: [0xfa,0xc2,0xfe,0x7e,0x7f,0x5f,0x01,0x01]
259
+
260
+ v_cos_f16 v5.h, v1.h row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 fi:0
261
+ // GFX11: v_cos_f16_dpp v5.h, v1.h row_xmask:0 row_mask:0x1 bank_mask:0x3 bound_ctrl:1 ; encoding: [0xfa,0xc2,0x0a,0x7f,0x81,0x60,0x09,0x13]
262
+
263
+ v_cos_f16 v127.h, -|v127.h| row_xmask:15 row_mask:0x3 bank_mask:0x0 bound_ctrl:0 fi:1
264
+ // GFX11: v_cos_f16_dpp v127.h, -|v127.h| row_xmask:15 row_mask:0x3 bank_mask:0x0 fi:1 ; encoding: [0xfa,0xc2,0xfe,0x7f,0xff,0x6f,0x35,0x30]
256
265
257
266
v_cos_f32 v5, v1 quad_perm:[3 ,2 ,1 ,0 ]
258
267
// GFX11: v_cos_f32_dpp v5, v1 quad_perm:[3 ,2 ,1 ,0 ] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0x6c,0x0a,0x7e,0x01,0x1b,0x00,0xff]
0 commit comments