@@ -2119,104 +2119,116 @@ v_div_scale_f64 v[254:255], vcc, 0xaf123456, -vcc, -1 clamp div:2
2119
2119
// W64: encoding: [0xfe,0xea,0xfd,0xd6,0xff,0xd4,0x04,0x5b,0x56,0x34,0x12,0xaf]
2120
2120
// W32-ERR: :[[@LINE-2 ]]:{{[0-9 ]+}}: error: invalid operand for instruction
2121
2121
2122
- v_dot2_bf16_bf16 v5, v1, v2, s3
2122
+ v_dot2_bf16_bf16 v5.l , v1, v2, s3
2123
2123
// GFX11: encoding: [0x05,0x00,0x67,0xd6,0x01,0x05,0x0e,0x00]
2124
2124
2125
- v_dot2_bf16_bf16 v5, v255, v255, s105
2125
+ v_dot2_bf16_bf16 v5.l , v255, v255, s105
2126
2126
// GFX11: encoding: [0x05,0x00,0x67,0xd6,0xff,0xff,0xa7,0x01]
2127
2127
2128
- v_dot2_bf16_bf16 v5, s1, s2, v3
2128
+ v_dot2_bf16_bf16 v5.l , s1, s2, v3.l
2129
2129
// GFX11: encoding: [0x05,0x00,0x67,0xd6,0x01,0x04,0x0c,0x04]
2130
2130
2131
- v_dot2_bf16_bf16 v5, s105, s105, m0
2131
+ v_dot2_bf16_bf16 v5.l , s105, s105, m0
2132
2132
// GFX11: encoding: [0x05,0x00,0x67,0xd6,0x69,0xd2,0xf4,0x01]
2133
2133
2134
- v_dot2_bf16_bf16 v5, vcc_lo, ttmp15, v255
2135
- // GFX11: encoding: [0x05,0x00 ,0x67,0xd6,0x6a,0xf6,0xfc,0x07]
2134
+ v_dot2_bf16_bf16 v5.l , vcc_lo, ttmp15, v255.h
2135
+ // GFX11: encoding: [0x05,0x20 ,0x67,0xd6,0x6a,0xf6,0xfc,0x07]
2136
2136
2137
- v_dot2_bf16_bf16 v5, vcc_hi, 0xfe0b, vcc_hi
2137
+ v_dot2_bf16_bf16 v5.l , vcc_hi, 0xfe0b, vcc_hi
2138
2138
// GFX11: encoding: [0x05,0x00,0x67,0xd6,0x6b,0xfe,0xad,0x01,0x0b,0xfe,0x00,0x00]
2139
2139
2140
- v_dot2_bf16_bf16 v5, ttmp15, src_scc, ttmp15
2140
+ v_dot2_bf16_bf16 v5.l , ttmp15, src_scc, ttmp15
2141
2141
// GFX11: encoding: [0x05,0x00,0x67,0xd6,0x7b,0xfa,0xed,0x01]
2142
2142
2143
- v_dot2_bf16_bf16 v5, |m0|, -1 , -vcc_lo
2143
+ v_dot2_bf16_bf16 v5.l , |m0|, -1 , -vcc_lo
2144
2144
// GFX11: encoding: [0x05,0x01,0x67,0xd6,0x7d,0x82,0xa9,0x81]
2145
2145
2146
- v_dot2_bf16_bf16 v5, -|exec_lo|, null, -|0xfe0b|
2146
+ v_dot2_bf16_bf16 v5.l , -|exec_lo|, null, -|0xfe0b|
2147
2147
// GFX11: encoding: [0x05,0x05,0x67,0xd6,0x7e,0xf8,0xfc,0xa3,0x0b,0xfe,0x00,0x00]
2148
2148
2149
- v_dot2_bf16_bf16 v5, -|exec_hi|, -|exec_lo|, -|exec_lo|
2149
+ v_dot2_bf16_bf16 v5.l , -|exec_hi|, -|exec_lo|, -|exec_lo|
2150
2150
// GFX11: encoding: [0x05,0x07,0x67,0xd6,0x7f,0xfc,0xf8,0xe1]
2151
2151
2152
- v_dot2_bf16_bf16 v5, null, -exec_hi, |src_scc|
2152
+ v_dot2_bf16_bf16 v5.l , null, -exec_hi, |src_scc|
2153
2153
// GFX11: encoding: [0x05,0x04,0x67,0xd6,0x7c,0xfe,0xf4,0x43]
2154
2154
2155
- v_dot2_bf16_bf16 v5, -1 , -|m0|, -|exec_hi| op_sel:[ 0 , 0 , 0 , 0 ]
2155
+ v_dot2_bf16_bf16 v5.l , -1 , -|m0|, -|exec_hi|
2156
2156
// GFX11: encoding: [0x05,0x06,0x67,0xd6,0xc1,0xfa,0xfc,0xc1]
2157
2157
2158
- v_dot2_bf16_bf16 v5, -src_scc, |vcc_lo|, -1 op_sel:[ 0 , 0 , 1 , 0 ]
2159
- // GFX11: encoding: [0x05,0x22 ,0x67,0xd6,0xfd,0xd4,0x04,0x23]
2158
+ v_dot2_bf16_bf16 v5.l , -src_scc, |vcc_lo|, -1
2159
+ // GFX11: encoding: [0x05,0x02 ,0x67,0xd6,0xfd,0xd4,0x04,0x23]
2160
2160
2161
- v_dot2_bf16_bf16 v255, -|0xfe0b|, -|vcc_hi|, null op_sel:[ 0 , 0 , 0 , 1 ]
2161
+ v_dot2_bf16_bf16 v255.h , -|0xfe0b|, -|vcc_hi|, null
2162
2162
// GFX11: encoding: [0xff,0x43,0x67,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2163
2163
2164
- v_dot2_bf16_bf16 v2, v0, 0x20004000, v2
2165
- // GFX11: v_dot2_bf16_bf16 v2, v0, 0x20004000, v2 ; encoding: [0x02,0x00,0x67,0xd6,0x00,0xff,0x09,0x04,0x00,0x40,0x00,0x20]
2164
+ v_dot2_bf16_bf16 v2.l , v0, 0x20004000, v2.l
2165
+ // GFX11: encoding: [0x02,0x00,0x67,0xd6,0x00,0xff,0x09,0x04,0x00,0x40,0x00,0x20]
2166
2166
2167
- v_dot2_bf16_bf16 v2, 0x20004000, v0, v2
2168
- // GFX11: v_dot2_bf16_bf16 v2, 0x20004000, v0, v2 ; encoding: [0x02,0x00,0x67,0xd6,0xff,0x00,0x0a,0x04,0x00,0x40,0x00,0x20]
2167
+ v_dot2_bf16_bf16 v2.l , 0x20004000, v0, v2.l
2168
+ // GFX11: encoding: [0x02,0x00,0x67,0xd6,0xff,0x00,0x0a,0x04,0x00,0x40,0x00,0x20]
2169
2169
2170
- v_dot2_f16_f16 v5, v1, v2, s3
2170
+ v_dot2_bf16_bf16 v5.l, vcc_lo, ttmp15, v255.h
2171
+ // GFX11: encoding: [0x05,0x20,0x67,0xd6,0x6a,0xf6,0xfc,0x07]
2172
+
2173
+ v_dot2_bf16_bf16 v255.h, -|0xfe0b|, -|vcc_hi|, null
2174
+ // GFX11: encoding: [0xff,0x43,0x67,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2175
+
2176
+ v_dot2_f16_f16 v5.l, v1, v2, s3
2171
2177
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0x01,0x05,0x0e,0x00]
2172
2178
2173
- v_dot2_f16_f16 v5, v255, s2, s105
2179
+ v_dot2_f16_f16 v5.l , v255, s2, s105
2174
2180
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0xff,0x05,0xa4,0x01]
2175
2181
2176
- v_dot2_f16_f16 v5, s1, v255, exec_hi
2182
+ v_dot2_f16_f16 v5.l , s1, v255, exec_hi
2177
2183
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0x01,0xfe,0xff,0x01]
2178
2184
2179
- v_dot2_f16_f16 v5, s105, s105, exec_lo
2185
+ v_dot2_f16_f16 v5.l , s105, s105, exec_lo
2180
2186
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0x69,0xd2,0xf8,0x01]
2181
2187
2182
- v_dot2_f16_f16 v5, vcc_lo, ttmp15, v3
2188
+ v_dot2_f16_f16 v5.l , vcc_lo, ttmp15, v3.l
2183
2189
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0x6a,0xf6,0x0c,0x04]
2184
2190
2185
- v_dot2_f16_f16 v5, vcc_hi, 0xfe0b, v255
2186
- // GFX11: encoding: [0x05,0x00 ,0x66,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2191
+ v_dot2_f16_f16 v5.l , vcc_hi, 0xfe0b, v255.h
2192
+ // GFX11: encoding: [0x05,0x20 ,0x66,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2187
2193
2188
- v_dot2_f16_f16 v5, -|ttmp15|, -|src_scc|, -|ttmp15|
2194
+ v_dot2_f16_f16 v5.l , -|ttmp15|, -|src_scc|, -|ttmp15|
2189
2195
// GFX11: encoding: [0x05,0x07,0x66,0xd6,0x7b,0xfa,0xed,0xe1]
2190
2196
2191
- v_dot2_f16_f16 v5, m0, 0 .5 , m0
2197
+ v_dot2_f16_f16 v5.l , m0, 0 .5 , m0
2192
2198
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0x7d,0xe0,0xf5,0x01]
2193
2199
2194
- v_dot2_f16_f16 v5, |exec_lo|, -1 , vcc_hi
2200
+ v_dot2_f16_f16 v5.l , |exec_lo|, -1 , vcc_hi
2195
2201
// GFX11: encoding: [0x05,0x01,0x66,0xd6,0x7e,0x82,0xad,0x01]
2196
2202
2197
- v_dot2_f16_f16 v5, -|exec_hi|, null, -|vcc_lo|
2203
+ v_dot2_f16_f16 v5.l , -|exec_hi|, null, -|vcc_lo|
2198
2204
// GFX11: encoding: [0x05,0x05,0x66,0xd6,0x7f,0xf8,0xa8,0xa1]
2199
2205
2200
- v_dot2_f16_f16 v5, null, exec_lo, -|0xfe0b|
2206
+ v_dot2_f16_f16 v5.l , null, exec_lo, -|0xfe0b|
2201
2207
// GFX11: encoding: [0x05,0x04,0x66,0xd6,0x7c,0xfc,0xfc,0x83,0x0b,0xfe,0x00,0x00]
2202
2208
2203
- v_dot2_f16_f16 v5, -1 , -|exec_hi|, -|src_scc|
2209
+ v_dot2_f16_f16 v5.l , -1 , -|exec_hi|, -|src_scc|
2204
2210
// GFX11: encoding: [0x05,0x06,0x66,0xd6,0xc1,0xfe,0xf4,0xc3]
2205
2211
2206
- v_dot2_f16_f16 v5, 0 .5 , -m0, 0 .5 op_sel:[ 0 , 0 , 0 , 0 ]
2212
+ v_dot2_f16_f16 v5.l , 0 .5 , -m0, 0 .5
2207
2213
// GFX11: encoding: [0x05,0x00,0x66,0xd6,0xf0,0xfa,0xc0,0x43]
2208
2214
2209
- v_dot2_f16_f16 v5, -src_scc, |vcc_lo|, -1 op_sel:[0 ,0 ,1 ,0 ]
2215
+ v_dot2_f16_f16 v5.l , -src_scc, |vcc_lo|, -1 op_sel:[0 ,0 ,1 ,0 ]
2210
2216
// GFX11: encoding: [0x05,0x22,0x66,0xd6,0xfd,0xd4,0x04,0x23]
2211
2217
2212
- v_dot2_f16_f16 v255, -|0xfe0b|, -|vcc_hi|, null op_sel:[ 0 , 0 , 0 , 1 ]
2218
+ v_dot2_f16_f16 v255.h , -|0xfe0b|, -|vcc_hi|, null
2213
2219
// GFX11: encoding: [0xff,0x43,0x66,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2214
2220
2215
- v_dot2_f16_f16 v2, v0, 0x20004000, v2
2216
- // GFX11: v_dot2_f16_f16 v2, v0, 0x20004000, v2 ; encoding: [0x02,0x00,0x66,0xd6,0x00,0xff,0x09,0x04,0x00,0x40,0x00,0x20]
2221
+ v_dot2_f16_f16 v2.l , v0, 0x20004000, v2.l
2222
+ // GFX11: encoding: [0x02,0x00,0x66,0xd6,0x00,0xff,0x09,0x04,0x00,0x40,0x00,0x20]
2217
2223
2218
- v_dot2_f16_f16 v2, 0x20004000, v0, v2
2219
- // GFX11: v_dot2_f16_f16 v2, 0x20004000, v0, v2 ; encoding: [0x02,0x00,0x66,0xd6,0xff,0x00,0x0a,0x04,0x00,0x40,0x00,0x20]
2224
+ v_dot2_f16_f16 v2.l, 0x20004000, v0, v2.l
2225
+ // GFX11: encoding: [0x02,0x00,0x66,0xd6,0xff,0x00,0x0a,0x04,0x00,0x40,0x00,0x20]
2226
+
2227
+ v_dot2_f16_f16 v5.l, vcc_hi, 0xfe0b, v255.h
2228
+ // GFX11: encoding: [0x05,0x20,0x66,0xd6,0x6b,0xfe,0xfd,0x07,0x0b,0xfe,0x00,0x00]
2229
+
2230
+ v_dot2_f16_f16 v255.h, -|0xfe0b|, -|vcc_hi|, null
2231
+ // GFX11: encoding: [0xff,0x43,0x66,0xd6,0xff,0xd6,0xf0,0x61,0x0b,0xfe,0x00,0x00]
2220
2232
2221
2233
v_fma_dx9_zero_f32 v5, v1, v2, s3
2222
2234
// GFX11: encoding: [0x05,0x00,0x09,0xd6,0x01,0x05,0x0e,0x00]
0 commit comments