@@ -94,6 +94,18 @@ v_ceil_f16 v5.l, src_scc
94
94
v_ceil_f16 v127.l, 0xfe0b
95
95
// GFX12: v_ceil_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xb8,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
96
96
97
+ v_ceil_f16 v5.l, v1.h
98
+ // GFX12: v_ceil_f16_e32 v5.l, v1.h ; encoding: [0x81,0xb9,0x0a,0x7e]
99
+
100
+ v_ceil_f16 v5.l, v127.h
101
+ // GFX12: v_ceil_f16_e32 v5.l, v127.h ; encoding: [0xff,0xb9,0x0a,0x7e]
102
+
103
+ v_ceil_f16 v5.h, src_scc
104
+ // GFX12: v_ceil_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xb8,0x0a,0x7f]
105
+
106
+ v_ceil_f16 v127.h, 0xfe0b
107
+ // GFX12: v_ceil_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xb8,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
108
+
97
109
v_ceil_f32 v5, v1
98
110
// GFX12: v_ceil_f32_e32 v5, v1 ; encoding: [0x01,0x45,0x0a,0x7e]
99
111
@@ -1886,6 +1898,18 @@ v_exp_f16 v5.l, src_scc
1886
1898
v_exp_f16 v127.l, 0xfe0b
1887
1899
// GFX12: v_exp_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xb0,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
1888
1900
1901
+ v_exp_f16 v5.l, v1.h
1902
+ // GFX12: v_exp_f16_e32 v5.l, v1.h ; encoding: [0x81,0xb1,0x0a,0x7e]
1903
+
1904
+ v_exp_f16 v5.l, v127.h
1905
+ // GFX12: v_exp_f16_e32 v5.l, v127.h ; encoding: [0xff,0xb1,0x0a,0x7e]
1906
+
1907
+ v_exp_f16 v5.h, src_scc
1908
+ // GFX12: v_exp_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xb0,0x0a,0x7f]
1909
+
1910
+ v_exp_f16 v127.h, 0xfe0b
1911
+ // GFX12: v_exp_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xb0,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
1912
+
1889
1913
v_exp_f32 v5, v1
1890
1914
// GFX12: v_exp_f32_e32 v5, v1 ; encoding: [0x01,0x4b,0x0a,0x7e]
1891
1915
@@ -2111,6 +2135,18 @@ v_floor_f16 v5.l, src_scc
2111
2135
v_floor_f16 v127.l, 0xfe0b
2112
2136
// GFX12: v_floor_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xb6,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
2113
2137
2138
+ v_floor_f16 v5.l, v1.h
2139
+ // GFX12: v_floor_f16_e32 v5.l, v1.h ; encoding: [0x81,0xb7,0x0a,0x7e]
2140
+
2141
+ v_floor_f16 v5.l, v127.h
2142
+ // GFX12: v_floor_f16_e32 v5.l, v127.h ; encoding: [0xff,0xb7,0x0a,0x7e]
2143
+
2144
+ v_floor_f16 v5.h, src_scc
2145
+ // GFX12: v_floor_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xb6,0x0a,0x7f]
2146
+
2147
+ v_floor_f16 v127.h, 0xfe0b
2148
+ // GFX12: v_floor_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xb6,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
2149
+
2114
2150
v_floor_f32 v5, v1
2115
2151
// GFX12: v_floor_f32_e32 v5, v1 ; encoding: [0x01,0x49,0x0a,0x7e]
2116
2152
@@ -2651,6 +2687,18 @@ v_log_f16 v5.l, src_scc
2651
2687
v_log_f16 v127.l, 0xfe0b
2652
2688
// GFX12: v_log_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xae,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
2653
2689
2690
+ v_log_f16 v5.l, v1.h
2691
+ // GFX12: v_log_f16_e32 v5.l, v1.h ; encoding: [0x81,0xaf,0x0a,0x7e]
2692
+
2693
+ v_log_f16 v5.l, v127.h
2694
+ // GFX12: v_log_f16_e32 v5.l, v127.h ; encoding: [0xff,0xaf,0x0a,0x7e]
2695
+
2696
+ v_log_f16 v5.h, src_scc
2697
+ // GFX12: v_log_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xae,0x0a,0x7f]
2698
+
2699
+ v_log_f16 v127.h, 0xfe0b
2700
+ // GFX12: v_log_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xae,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
2701
+
2654
2702
v_log_f32 v5, v1
2655
2703
// GFX12: v_log_f32_e32 v5, v1 ; encoding: [0x01,0x4f,0x0a,0x7e]
2656
2704
@@ -2995,6 +3043,18 @@ v_rcp_f16 v5.l, src_scc
2995
3043
v_rcp_f16 v127.l, 0xfe0b
2996
3044
// GFX12: v_rcp_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xa8,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
2997
3045
3046
+ v_rcp_f16 v5.l, v1.h
3047
+ // GFX12: v_rcp_f16_e32 v5.l, v1.h ; encoding: [0x81,0xa9,0x0a,0x7e]
3048
+
3049
+ v_rcp_f16 v5.l, v127.h
3050
+ // GFX12: v_rcp_f16_e32 v5.l, v127.h ; encoding: [0xff,0xa9,0x0a,0x7e]
3051
+
3052
+ v_rcp_f16 v5.h, src_scc
3053
+ // GFX12: v_rcp_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xa8,0x0a,0x7f]
3054
+
3055
+ v_rcp_f16 v127.h, 0xfe0b
3056
+ // GFX12: v_rcp_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xa8,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
3057
+
2998
3058
v_rcp_f32 v5, v1
2999
3059
// GFX12: v_rcp_f32_e32 v5, v1 ; encoding: [0x01,0x55,0x0a,0x7e]
3000
3060
@@ -3322,6 +3382,18 @@ v_rsq_f16 v5.l, src_scc
3322
3382
v_rsq_f16 v127.l, 0xfe0b
3323
3383
// GFX12: v_rsq_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xac,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
3324
3384
3385
+ v_rsq_f16 v5.l, v1.h
3386
+ // GFX12: v_rsq_f16_e32 v5.l, v1.h ; encoding: [0x81,0xad,0x0a,0x7e]
3387
+
3388
+ v_rsq_f16 v5.l, v127.h
3389
+ // GFX12: v_rsq_f16_e32 v5.l, v127.h ; encoding: [0xff,0xad,0x0a,0x7e]
3390
+
3391
+ v_rsq_f16 v5.h, src_scc
3392
+ // GFX12: v_rsq_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xac,0x0a,0x7f]
3393
+
3394
+ v_rsq_f16 v127.h, 0xfe0b
3395
+ // GFX12: v_rsq_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xac,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
3396
+
3325
3397
v_rsq_f32 v5, v1
3326
3398
// GFX12: v_rsq_f32_e32 v5, v1 ; encoding: [0x01,0x5d,0x0a,0x7e]
3327
3399
@@ -3616,6 +3688,18 @@ v_sqrt_f16 v5.l, src_scc
3616
3688
v_sqrt_f16 v127.l, 0xfe0b
3617
3689
// GFX12: v_sqrt_f16_e32 v127.l, 0xfe0b ; encoding: [0xff,0xaa,0xfe,0x7e,0x0b,0xfe,0x00,0x00]
3618
3690
3691
+ v_sqrt_f16 v5.l, v1.h
3692
+ // GFX12: v_sqrt_f16_e32 v5.l, v1.h ; encoding: [0x81,0xab,0x0a,0x7e]
3693
+
3694
+ v_sqrt_f16 v5.l, v127.h
3695
+ // GFX12: v_sqrt_f16_e32 v5.l, v127.h ; encoding: [0xff,0xab,0x0a,0x7e]
3696
+
3697
+ v_sqrt_f16 v5.h, src_scc
3698
+ // GFX12: v_sqrt_f16_e32 v5.h, src_scc ; encoding: [0xfd,0xaa,0x0a,0x7f]
3699
+
3700
+ v_sqrt_f16 v127.h, 0xfe0b
3701
+ // GFX12: v_sqrt_f16_e32 v127.h, 0xfe0b ; encoding: [0xff,0xaa,0xfe,0x7f,0x0b,0xfe,0x00,0x00]
3702
+
3619
3703
v_sqrt_f32 v5, v1
3620
3704
// GFX12: v_sqrt_f32_e32 v5, v1 ; encoding: [0x01,0x67,0x0a,0x7e]
3621
3705
0 commit comments