llvm
diff --git a/‎llvm/docs/AMDGPUModifierSyntax.rst
Lines changed: 3 additions & 1 deletion b/‎llvm/docs/AMDGPUModifierSyntax.rst
Lines changed: 3 additions & 1 deletion
diff --git a/‎llvm/lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp
Lines changed: 9 additions & 8 deletions b/‎llvm/lib/Target/AMDGPU/AsmParser/AMDGPUAsmParser.cpp
Lines changed: 9 additions & 8 deletions
diff --git a/‎llvm/lib/Target/AMDGPU/SIInstrInfo.td
Lines changed: 2 additions & 1 deletion b/‎llvm/lib/Target/AMDGPU/SIInstrInfo.td
Lines changed: 2 additions & 1 deletion
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop1_dpp16.s
Lines changed: 67 additions & 67 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop1_dpp16.s
Lines changed: 67 additions & 67 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop2_dpp16.s
Lines changed: 53 additions & 53 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop2_dpp16.s
Lines changed: 53 additions & 53 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16.s
Lines changed: 98 additions & 98 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16.s
Lines changed: 98 additions & 98 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vop1.s
Lines changed: 67 additions & 67 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vop1.s
Lines changed: 67 additions & 67 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vop2.s
Lines changed: 41 additions & 41 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vop2.s
Lines changed: 41 additions & 41 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vopc.s
Lines changed: 64 additions & 64 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vopc.s
Lines changed: 64 additions & 64 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vopcx.s
Lines changed: 64 additions & 64 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3_dpp16_from_vopcx.s
Lines changed: 64 additions & 64 deletions
diff --git a/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3p_dpp16.s
Lines changed: 2 additions & 2 deletions b/‎llvm/test/MC/AMDGPU/gfx11_asm_vop3p_dpp16.s
Lines changed: 2 additions & 2 deletions
@@ -1406,9 +1406,11 @@ invalid lanes is disabled.
 
                                              Accessing data from an invalid lane will
                                              return zero.
+
+    bound_ctrl:0 (GFX11+)                    Disables data sharing with invalid lanes.
     ======================================== ================================================
 
-.. WARNING:: For historical reasons, *bound_ctrl:0* has the same meaning as *bound_ctrl:1*.
+.. WARNING:: For historical reasons, *bound_ctrl:0* has the same meaning as *bound_ctrl:1* on architectures older than GFX11.
 
 .. _amdgpu_synid_fi16:
 
 
@@ -1552,7 +1552,7 @@ class AMDGPUAsmParser : public MCTargetAsmParser {
   OperandMatchResultTy
   parseIntWithPrefix(const char *Prefix, OperandVector &Operands,
                      AMDGPUOperand::ImmTy ImmTy = AMDGPUOperand::ImmTyNone,
-                     bool (*ConvertResult)(int64_t &) = nullptr);
+                     std::function<bool(int64_t &)> ConvertResult = nullptr);
 
   OperandMatchResultTy
   parseOperandArrayWithPrefix(const char *Prefix,
@@ -1785,6 +1785,7 @@ class AMDGPUAsmParser : public MCTargetAsmParser {
 
   bool parseDimId(unsigned &Encoding);
   OperandMatchResultTy parseDim(OperandVector &Operands);
+  bool convertDppBoundCtrl(int64_t &BoundCtrl);
   OperandMatchResultTy parseDPP8(OperandVector &Operands);
   OperandMatchResultTy parseDPPCtrl(OperandVector &Operands);
   bool isSupportedDPPCtrl(StringRef Ctrl, const OperandVector &Operands);
@@ -5929,10 +5930,9 @@ AMDGPUAsmParser::parseIntWithPrefix(const char *Prefix, int64_t &IntVal) {
   return parseExpr(IntVal) ? MatchOperand_Success : MatchOperand_ParseFail;
 }
 
-OperandMatchResultTy
-AMDGPUAsmParser::parseIntWithPrefix(const char *Prefix, OperandVector &Operands,
-                                    AMDGPUOperand::ImmTy ImmTy,
-                                    bool (*ConvertResult)(int64_t&)) {
+OperandMatchResultTy AMDGPUAsmParser::parseIntWithPrefix(
+    const char *Prefix, OperandVector &Operands, AMDGPUOperand::ImmTy ImmTy,
+    std::function<bool(int64_t &)> ConvertResult) {
   SMLoc S = getLoc();
   int64_t Value = 0;
 
@@ -8011,12 +8011,13 @@ static bool ConvertOmodDiv(int64_t &Div) {
   return false;
 }
 
-// Both bound_ctrl:0 and bound_ctrl:1 are encoded as 1.
+// For pre-gfx11 targets, both bound_ctrl:0 and bound_ctrl:1 are encoded as 1.
 // This is intentional and ensures compatibility with sp3.
 // See bug 35397 for details.
-static bool ConvertDppBoundCtrl(int64_t &BoundCtrl) {
+bool AMDGPUAsmParser::convertDppBoundCtrl(int64_t &BoundCtrl) {
   if (BoundCtrl == 0 || BoundCtrl == 1) {
-    BoundCtrl = 1;
+    if (!isGFX11Plus())
+      BoundCtrl = 1;
     return true;
   }
   return false;
 
@@ -1273,7 +1273,8 @@ def dpp_ctrl : NamedOperandU32<"DPPCtrl", NamedMatchClass<"DPPCtrl", 0>>;
 
 def row_mask : NamedOperandU32<"RowMask", NamedMatchClass<"RowMask">>;
 def bank_mask : NamedOperandU32<"BankMask", NamedMatchClass<"BankMask">>;
-def bound_ctrl : NamedIntOperand<i1, "bound_ctrl", "DppBoundCtrl", "ConvertDppBoundCtrl">;
+def bound_ctrl : NamedIntOperand<i1, "bound_ctrl", "DppBoundCtrl",
+    "[this] (int64_t &BC) -> bool { return convertDppBoundCtrl(BC); }">;
 def FI : NamedOperandU32<"FI", NamedMatchClass<"FI">>;
 
 def blgp : NamedOperandU32<"BLGP", NamedMatchClass<"BLGP">>;
 
@@ -2,13 +2,13 @@
 // RUN: llvm-mc -arch=amdgcn -mcpu=gfx1100 -mattr=-wavefrontsize32,+wavefrontsize64 -show-encoding %s | FileCheck --check-prefixes=GFX11 %s
 
 v_dot2_f32_f16 v0, v1, v2, v3 neg_lo:[0,0,0] neg_hi:[0,0,0] quad_perm:[2,2,3,1] bound_ctrl:0 fi:1
-// GFX11: v_dot2_f32_f16_e64_dpp v0, v1, v2, v3 quad_perm:[2,2,3,1] row_mask:0xf bank_mask:0xf bound_ctrl:1 fi:1 ; encoding: [0x00,0x00,0x13,0xcc,0xfa,0x04,0x0e,0x04,0x01,0x7a,0x0c,0xff]
+// GFX11: v_dot2_f32_f16_e64_dpp v0, v1, v2, v3 quad_perm:[2,2,3,1] row_mask:0xf bank_mask:0xf fi:1 ; encoding: [0x00,0x00,0x13,0xcc,0xfa,0x04,0x0e,0x04,0x01,0x7a,0x04,0xff]
 
 v_dot2_f32_f16 v0, v1, v2, v3 neg_lo:[1,1,0] neg_hi:[1,0,1] quad_perm:[3,2,1,0] bank_mask:0xe
 // GFX11: v_dot2_f32_f16_e64_dpp v0, v1, v2, v3 neg_lo:[1,1,0] neg_hi:[1,0,1] quad_perm:[3,2,1,0] row_mask:0xf bank_mask:0xe ; encoding: [0x00,0x05,0x13,0xcc,0xfa,0x04,0x0e,0x64,0x01,0x1b,0x00,0xfe]
 
 v_fma_mix_f32 v0, v1, v2, v3 op_sel:[0,0,0] row_ror:7 bank_mask:0x1 bound_ctrl:0
-// GFX11: v_fma_mix_f32_e64_dpp v0, v1, v2, v3 row_ror:7 row_mask:0xf bank_mask:0x1 bound_ctrl:1 ; encoding: [0x00,0x00,0x20,0xcc,0xfa,0x04,0x0e,0x04,0x01,0x27,0x09,0xf1]
+// GFX11: v_fma_mix_f32_e64_dpp v0, v1, v2, v3 row_ror:7 row_mask:0xf bank_mask:0x1 ; encoding: [0x00,0x00,0x20,0xcc,0xfa,0x04,0x0e,0x04,0x01,0x27,0x01,0xf1]
 
 v_fma_mixhi_f16 v0, v1, v2, v3 op_sel_hi:[1,1,1] clamp quad_perm:[0,2,3,1] row_mask:0x0
 // GFX11: v_fma_mixhi_f16_e64_dpp v0, v1, v2, v3 op_sel_hi:[1,1,1] clamp quad_perm:[0,2,3,1] row_mask:0x0 bank_mask:0xf ; encoding: [0x00,0xc0,0x22,0xcc,0xfa,0x04,0x0e,0x1c,0x01,0x78,0x00,0x0f]