@@ -2174,53 +2174,89 @@ v_fma_dx9_zero_f32 v5, -src_scc, |vcc_lo|, -1 mul:4
2174
2174
v_fma_dx9_zero_f32 v255, -|0xaf123456|, -|vcc_hi|, null clamp div:2
2175
2175
// GFX11: v_fma_dx9_zero_f32 v255, -|0xaf123456|, -|vcc_hi|, null clamp div:2 ; encoding: [0xff,0x83,0x09,0xd6,0xff,0xd6,0xf0,0x79,0x56,0x34,0x12,0xaf]
2176
2176
2177
- v_fma_f16 v5, v1, v2, s3
2178
- // GFX11: v_fma_f16 v5, v1, v2, s3 ; encoding: [0x05,0x00,0x48,0xd6,0x01,0x05,0x0e,0x00]
2177
+ v_fma_f16 v5.l , v1.l , v2.l , s3
2178
+ // GFX11: v_fma_f16 v5.l , v1.l , v2.l , s3 ; encoding: [0x05,0x00,0x48,0xd6,0x01,0x05,0x0e,0x00]
2179
2179
2180
- v_fma_f16 v5, v255, s2, s105
2181
- // GFX11: v_fma_f16 v5, v255, s2, s105 ; encoding: [0x05,0x00,0x48,0xd6,0xff,0x05,0xa4,0x01]
2180
+ v_fma_f16 v5.l , v255.l , s2, s105
2181
+ // GFX11: v_fma_f16 v5.l , v255.l , s2, s105 ; encoding: [0x05,0x00,0x48,0xd6,0xff,0x05,0xa4,0x01]
2182
2182
2183
- v_fma_f16 v5, s1, v255, exec_hi
2184
- // GFX11: v_fma_f16 v5, s1, v255, exec_hi ; encoding: [0x05,0x00,0x48,0xd6,0x01,0xfe,0xff,0x01]
2183
+ v_fma_f16 v5.l , s1, v255.l , exec_hi
2184
+ // GFX11: v_fma_f16 v5.l , s1, v255.l , exec_hi ; encoding: [0x05,0x00,0x48,0xd6,0x01,0xfe,0xff,0x01]
2185
2185
2186
- v_fma_f16 v5, s105, s105, exec_lo
2187
- // GFX11: v_fma_f16 v5, s105, s105, exec_lo ; encoding: [0x05,0x00,0x48,0xd6,0x69,0xd2,0xf8,0x01]
2186
+ v_fma_f16 v5.l , s105, s105, exec_lo
2187
+ // GFX11: v_fma_f16 v5.l , s105, s105, exec_lo ; encoding: [0x05,0x00,0x48,0xd6,0x69,0xd2,0xf8,0x01]
2188
2188
2189
- v_fma_f16 v5, vcc_lo, ttmp15, v3
2190
- // GFX11: v_fma_f16 v5, vcc_lo, ttmp15, v3 ; encoding: [0x05,0x00,0x48,0xd6,0x6a,0xf6,0x0c,0x04]
2189
+ v_fma_f16 v5.l , vcc_lo, ttmp15, v3.l
2190
+ // GFX11: v_fma_f16 v5.l , vcc_lo, ttmp15, v3.l ; encoding: [0x05,0x00,0x48,0xd6,0x6a,0xf6,0x0c,0x04]
2191
2191
2192
- v_fma_f16 v5, vcc_hi, 0xfe0b, v255
2193
- // GFX11: v_fma_f16 v5, vcc_hi, 0xfe0b, v255 ; encoding: [0x05,0x00,0x48,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2192
+ v_fma_f16 v5.l , vcc_hi, 0xfe0b, v255.l
2193
+ // GFX11: v_fma_f16 v5.l , vcc_hi, 0xfe0b, v255.l ; encoding: [0x05,0x00,0x48,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2194
2194
2195
- v_fma_f16 v5, -|ttmp15|, -|src_scc|, -|ttmp15|
2196
- // GFX11: v_fma_f16 v5, -|ttmp15|, -|src_scc|, -|ttmp15| ; encoding: [0x05,0x07,0x48,0xd6,0x7b,0xfa,0xed,0xe1]
2195
+ v_fma_f16 v5.l , -|ttmp15|, -|src_scc|, -|ttmp15|
2196
+ // GFX11: v_fma_f16 v5.l , -|ttmp15|, -|src_scc|, -|ttmp15| ; encoding: [0x05,0x07,0x48,0xd6,0x7b,0xfa,0xed,0xe1]
2197
2197
2198
- v_fma_f16 v5, m0, 0 .5 , m0
2199
- // GFX11: v_fma_f16 v5, m0, 0 .5 , m0 ; encoding: [0x05,0x00,0x48,0xd6,0x7d,0xe0,0xf5,0x01]
2198
+ v_fma_f16 v5.l , m0, 0 .5 , m0
2199
+ // GFX11: v_fma_f16 v5.l , m0, 0 .5 , m0 ; encoding: [0x05,0x00,0x48,0xd6,0x7d,0xe0,0xf5,0x01]
2200
2200
2201
- v_fma_f16 v5, |exec_lo|, -1 , vcc_hi
2202
- // GFX11: v_fma_f16 v5, |exec_lo|, -1 , vcc_hi ; encoding: [0x05,0x01,0x48,0xd6,0x7e,0x82,0xad,0x01]
2201
+ v_fma_f16 v5.l , |exec_lo|, -1 , vcc_hi
2202
+ // GFX11: v_fma_f16 v5.l , |exec_lo|, -1 , vcc_hi ; encoding: [0x05,0x01,0x48,0xd6,0x7e,0x82,0xad,0x01]
2203
2203
2204
- v_fma_f16 v5, -|exec_hi|, null, -|vcc_lo| op_sel:[1 ,1 ,1 ,1 ]
2205
- // GFX11: v_fma_f16 v5, -|exec_hi|, null, -|vcc_lo| op_sel:[1 ,1 ,1 ,1 ] ; encoding: [0x05,0x7d,0x48,0xd6,0x7f,0xf8,0xa8,0xa1]
2204
+ v_fma_f16 v5.h , -|exec_hi|, null, -|vcc_lo| op_sel:[1 ,1 ,1 ,1 ]
2205
+ // GFX11: v_fma_f16 v5.h , -|exec_hi|, null, -|vcc_lo| op_sel:[1 ,1 ,1 ,1 ] ; encoding: [0x05,0x7d,0x48,0xd6,0x7f,0xf8,0xa8,0xa1]
2206
2206
2207
- v_fma_f16 v5, null, exec_lo, -|0xfe0b| op_sel:[ 0 , 0 , 0 , 0 ]
2208
- // GFX11: v_fma_f16 v5, null, exec_lo, -|0xfe0b| ; encoding: [0x05,0x04,0x48,0xd6,0x7c,0xfc,0xfc,0x83,0x0b,0xfe,0x00,0x00]
2207
+ v_fma_f16 v5.l , null, exec_lo, -|0xfe0b|
2208
+ // GFX11: v_fma_f16 v5.l , null, exec_lo, -|0xfe0b| ; encoding: [0x05,0x04,0x48,0xd6,0x7c,0xfc,0xfc,0x83,0x0b,0xfe,0x00,0x00]
2209
2209
2210
- v_fma_f16 v5, -1 , -|exec_hi|, -|src_scc| op_sel:[1 ,0 ,0 ,0 ]
2211
- // GFX11: v_fma_f16 v5, -1 , -|exec_hi|, -|src_scc| op_sel:[1 ,0 ,0 ,0 ] ; encoding: [0x05,0x0e,0x48,0xd6,0xc1,0xfe,0xf4,0xc3]
2210
+ v_fma_f16 v5.l , -1 , -|exec_hi|, -|src_scc| op_sel:[1 ,0 ,0 ,0 ]
2211
+ // GFX11: v_fma_f16 v5.l , -1 , -|exec_hi|, -|src_scc| op_sel:[1 ,0 ,0 ,0 ] ; encoding: [0x05,0x0e,0x48,0xd6,0xc1,0xfe,0xf4,0xc3]
2212
2212
2213
- v_fma_f16 v5, 0 .5 , -m0, 0 .5 op_sel:[0 ,1 ,0 ,0 ]
2214
- // GFX11: v_fma_f16 v5, 0 .5 , -m0, 0 .5 op_sel:[0 ,1 ,0 ,0 ] ; encoding: [0x05,0x10,0x48,0xd6,0xf0,0xfa,0xc0,0x43]
2213
+ v_fma_f16 v5.l , 0 .5 , -m0, 0 .5 op_sel:[0 ,1 ,0 ,0 ]
2214
+ // GFX11: v_fma_f16 v5.l , 0 .5 , -m0, 0 .5 op_sel:[0 ,1 ,0 ,0 ] ; encoding: [0x05,0x10,0x48,0xd6,0xf0,0xfa,0xc0,0x43]
2215
2215
2216
- v_fma_f16 v5, -src_scc, |vcc_lo|, -1 op_sel:[0 ,0 ,1 ,0 ]
2217
- // GFX11: v_fma_f16 v5, -src_scc, |vcc_lo|, -1 op_sel:[0 ,0 ,1 ,0 ] ; encoding: [0x05,0x22,0x48,0xd6,0xfd,0xd4,0x04,0x23]
2216
+ v_fma_f16 v5.l , -src_scc, |vcc_lo|, -1 op_sel:[0 ,0 ,1 ,0 ]
2217
+ // GFX11: v_fma_f16 v5.l , -src_scc, |vcc_lo|, -1 op_sel:[0 ,0 ,1 ,0 ] ; encoding: [0x05,0x22,0x48,0xd6,0xfd,0xd4,0x04,0x23]
2218
2218
2219
- v_fma_f16 v255, -|0xfe0b|, -|vcc_hi|, null op_sel:[ 0 , 0 , 0 , 1 ] clamp
2220
- // GFX11: v_fma_f16 v255, -|0xfe0b|, -|vcc_hi|, null op_sel:[0 ,0 ,0 ,1 ] clamp ; encoding: [0xff,0xc3,0x48,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2219
+ v_fma_f16 v255.h , -|0xfe0b|, -|vcc_hi|, null clamp
2220
+ // GFX11: v_fma_f16 v255.h , -|0xfe0b|, -|vcc_hi|, null op_sel:[0 ,0 ,0 ,1 ] clamp ; encoding: [0xff,0xc3,0x48,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2221
2221
2222
- v_fma_f16 v255, -|0xfe0b|, -|vcc_hi|, null op_sel:[0 ,0 ,0 ,1 ] clamp div:2
2223
- // GFX11: v_fma_f16 v255, -|0xfe0b|, -|vcc_hi|, null op_sel:[0 ,0 ,0 ,1 ] clamp div:2 ; encoding: [0xff,0xc3,0x48,0xd6,0xff,0xd6,0xf0,0x79,0x0b,0xfe,0x00,0x00]
2222
+ v_fma_f16 v255.h, -|0xfe0b|, -|vcc_hi|, null op_sel:[0 ,0 ,0 ,1 ] clamp div:2
2223
+ // GFX11: v_fma_f16 v255.h, -|0xfe0b|, -|vcc_hi|, null op_sel:[0 ,0 ,0 ,1 ] clamp div:2 ; encoding: [0xff,0xc3,0x48,0xd6,0xff,0xd6,0xf0,0x79,0x0b,0xfe,0x00,0x00]
2224
+
2225
+ v_fma_f16 v5.l, v255.h, s2, s105
2226
+ // GFX11: v_fma_f16 v5.l, v255.h, s2, s105 op_sel:[1 ,0 ,0 ,0 ] ; encoding: [0x05,0x08,0x48,0xd6,0xff,0x05,0xa4,0x01]
2227
+
2228
+ v_fma_f16 v5.l, s1, v255.h, exec_hi
2229
+ // GFX11: v_fma_f16 v5.l, s1, v255.h, exec_hi op_sel:[0 ,1 ,0 ,0 ] ; encoding: [0x05,0x10,0x48,0xd6,0x01,0xfe,0xff,0x01]
2230
+
2231
+ v_fma_f16 v5.l, vcc_hi, 0xfe0b, v255.h
2232
+ // GFX11: v_fma_f16 v5.l, vcc_hi, 0xfe0b, v255.h op_sel:[0 ,0 ,1 ,0 ] ; encoding: [0x05,0x20,0x48,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2233
+
2234
+ v_fma_f16 v5.l, -|exec_hi|, null, -|vcc_lo|
2235
+ // GFX11: v_fma_f16 v5.l, -|exec_hi|, null, -|vcc_lo| ; encoding: [0x05,0x05,0x48,0xd6,0x7f,0xf8,0xa8,0xa1]
2236
+
2237
+ v_fma_f16 v5.l, -1 , -|exec_hi|, -|src_scc|
2238
+ // GFX11: v_fma_f16 v5.l, -1 , -|exec_hi|, -|src_scc| ; encoding: [0x05,0x06,0x48,0xd6,0xc1,0xfe,0xf4,0xc3]
2239
+
2240
+ v_fma_f16 v5.l, 0 .5 , -m0, 0 .5
2241
+ // GFX11: v_fma_f16 v5.l, 0 .5 , -m0, 0 .5 ; encoding: [0x05,0x00,0x48,0xd6,0xf0,0xfa,0xc0,0x43]
2242
+
2243
+ v_fma_f16 v5.l, -src_scc, |vcc_lo|, -1
2244
+ // GFX11: v_fma_f16 v5.l, -src_scc, |vcc_lo|, -1 ; encoding: [0x05,0x02,0x48,0xd6,0xfd,0xd4,0x04,0x23]
2245
+
2246
+ v_fma_f16 v255.l, -|0xfe0b|, -|vcc_hi|, null clamp div:2
2247
+ // GFX11: v_fma_f16 v255.l, -|0xfe0b|, -|vcc_hi|, null clamp div:2 ; encoding: [0xff,0x83,0x48,0xd6,0xff,0xd6,0xf0,0x79,0x0b,0xfe,0x00,0x00]
2248
+
2249
+ v_fma_f16 v5.l, v255.h, s2, s105
2250
+ // GFX11: [0x05,0x08,0x48,0xd6,0xff,0x05,0xa4,0x01]
2251
+
2252
+ v_fma_f16 v5.l, s1, v255.h, exec_hi
2253
+ // GFX11: [0x05,0x10,0x48,0xd6,0x01,0xfe,0xff,0x01]
2254
+
2255
+ v_fma_f16 v5.l, vcc_hi, 0xfe0b, v255.h
2256
+ // GFX11: [0x05,0x20,0x48,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2257
+
2258
+ v_fma_f16 v255.h, -|0xfe0b|, -|vcc_hi|, null clamp
2259
+ // GFX11: [0xff,0xc3,0x48,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2224
2260
2225
2261
v_fma_f32 v5, v1, v2, s3
2226
2262
// GFX11: v_fma_f32 v5, v1, v2, s3 ; encoding: [0x05,0x00,0x13,0xd6,0x01,0x05,0x0e,0x00]
0 commit comments