5 years ago · 9c0dcead36
--- a/docs/AMDGPU/AMDGPUAsmGFX8.rst
+++ b/docs/AMDGPU/AMDGPUAsmGFX8.rst
@@ -566,7 +566,7 @@ SOPC
 
				     s_cmp_lg_u64                   :ref:`ssrc0<amdgpu_synid8_ssrc64_0>`,    :ref:`ssrc1<amdgpu_synid8_ssrc64_0>`
			
 
				     s_cmp_lt_i32                   :ref:`ssrc0<amdgpu_synid8_ssrc32_0>`,    :ref:`ssrc1<amdgpu_synid8_ssrc32_0>`
			
 
				     s_cmp_lt_u32                   :ref:`ssrc0<amdgpu_synid8_ssrc32_0>`,    :ref:`ssrc1<amdgpu_synid8_ssrc32_0>`
			
 
				-    s_set_gpr_idx_on               :ref:`ssrc<amdgpu_synid8_ssrc32_0>`,     :ref:`imm4<amdgpu_synid8_imm4>`
			
 
				+    s_set_gpr_idx_on               :ref:`ssrc<amdgpu_synid8_ssrc32_0>`,     :ref:`imask<amdgpu_synid8_imask>`
			
 
				     s_setvskip                     :ref:`ssrc0<amdgpu_synid8_ssrc32_0>`,    :ref:`ssrc1<amdgpu_synid8_ssrc32_0>`
			
 
				 
			
 
				 SOPK
			
@@ -624,7 +624,7 @@ SOPP
 
				     s_nop                          :ref:`imm16<amdgpu_synid8_bimm16>`
			
 
				     s_sendmsg                      :ref:`msg<amdgpu_synid8_msg>`
			
 
				     s_sendmsghalt                  :ref:`msg<amdgpu_synid8_msg>`
			
 
				-    s_set_gpr_idx_mode             :ref:`imm4<amdgpu_synid8_imm4>`
			
 
				+    s_set_gpr_idx_mode             :ref:`imask<amdgpu_synid8_imask>`
			
 
				     s_set_gpr_idx_off
			
 
				     s_sethalt                      :ref:`imm16<amdgpu_synid8_bimm16>`
			
 
				     s_setkill                      :ref:`imm16<amdgpu_synid8_bimm16>`
			
@@ -1756,7 +1756,7 @@ VOPC
 
				     gfx8_fimm16
			
 
				     gfx8_fimm32
			
 
				     gfx8_hwreg
			
 
				-    gfx8_imm4
			
 
				+    gfx8_imask
			
 
				     gfx8_label
			
 
				     gfx8_msg
			
 
				     gfx8_param
			
--- a/docs/AMDGPU/AMDGPUAsmGFX9.rst
+++ b/docs/AMDGPU/AMDGPUAsmGFX9.rst
@@ -736,7 +736,7 @@ SOPC
 
				     s_cmp_lg_u64                   :ref:`ssrc0<amdgpu_synid9_ssrc64_0>`,    :ref:`ssrc1<amdgpu_synid9_ssrc64_0>`
			
 
				     s_cmp_lt_i32                   :ref:`ssrc0<amdgpu_synid9_ssrc32_0>`,    :ref:`ssrc1<amdgpu_synid9_ssrc32_0>`
			
 
				     s_cmp_lt_u32                   :ref:`ssrc0<amdgpu_synid9_ssrc32_0>`,    :ref:`ssrc1<amdgpu_synid9_ssrc32_0>`
			
 
				-    s_set_gpr_idx_on               :ref:`ssrc<amdgpu_synid9_ssrc32_0>`,     :ref:`imm4<amdgpu_synid9_imm4>`
			
 
				+    s_set_gpr_idx_on               :ref:`ssrc<amdgpu_synid9_ssrc32_0>`,     :ref:`imask<amdgpu_synid9_imask>`
			
 
				     s_setvskip                     :ref:`ssrc0<amdgpu_synid9_ssrc32_0>`,    :ref:`ssrc1<amdgpu_synid9_ssrc32_0>`
			
 
				 
			
 
				 SOPK
			
@@ -796,7 +796,7 @@ SOPP
 
				     s_nop                          :ref:`imm16<amdgpu_synid9_bimm16>`
			
 
				     s_sendmsg                      :ref:`msg<amdgpu_synid9_msg>`
			
 
				     s_sendmsghalt                  :ref:`msg<amdgpu_synid9_msg>`
			
 
				-    s_set_gpr_idx_mode             :ref:`imm4<amdgpu_synid9_imm4>`
			
 
				+    s_set_gpr_idx_mode             :ref:`imask<amdgpu_synid9_imask>`
			
 
				     s_set_gpr_idx_off
			
 
				     s_sethalt                      :ref:`imm16<amdgpu_synid9_bimm16>`
			
 
				     s_setkill                      :ref:`imm16<amdgpu_synid9_bimm16>`
			
@@ -2010,7 +2010,7 @@ VOPC
 
				     gfx9_fimm16
			
 
				     gfx9_fimm32
			
 
				     gfx9_hwreg
			
 
				-    gfx9_imm4
			
 
				+    gfx9_imask
			
 
				     gfx9_label
			
 
				     gfx9_msg
			
 
				     gfx9_param
			
--- a/docs/AMDGPU/gfx10_bimm16.rst
+++ b/docs/AMDGPU/gfx10_bimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits.
			
 
				+A 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx10_bimm32.rst
+++ b/docs/AMDGPU/gfx10_bimm32.rst
@@ -10,5 +10,5 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value is truncated to 32 bits.
			
 
				 
			
--- a/docs/AMDGPU/gfx10_data_mimg_atomic_cmp.rst
+++ b/docs/AMDGPU/gfx10_data_mimg_atomic_cmp.rst
@@ -21,7 +21,7 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 2 data elements for 32-bit-per-pixel surfaces or 4 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx10_data_mimg_atomic_reg.rst
+++ b/docs/AMDGPU/gfx10_data_mimg_atomic_reg.rst
@@ -21,6 +21,6 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 1 data element for 32-bit-per-pixel surfaces or 2 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx10_fimm16.rst
+++ b/docs/AMDGPU/gfx10_fimm16.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The number is converted to *f16* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f16* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx10_fimm32.rst
+++ b/docs/AMDGPU/gfx10_fimm32.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The value is converted to *f32* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f32* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx10_hwreg.rst
+++ b/docs/AMDGPU/gfx10_hwreg.rst
@@ -14,18 +14,21 @@ Bits of a hardware register being accessed.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ===================================
			
 
				-    Bits         Description
			
 
				-    ============ ===================================
			
 
				-    5:0          Register *id*.
			
 
				-    10:6         First bit *offset* (0..31).
			
 
				-    15:11        *Size* in bits (1..32).
			
 
				-    ============ ===================================
			
 
				+    ======= ===================== ============
			
 
				+    Bits    Description           Value Range
			
 
				+    ======= ===================== ============
			
 
				+    5:0     Register *id*.        0..63
			
 
				+    10:6    First bit *offset*.   0..31
			
 
				+    15:11   *Size* in bits.       1..32
			
 
				+    ======= ===================== ============
			
 
				 
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below.
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* An *hwreg* value described below.
			
 
				 
			
 
				     ==================================== ============================================================================
			
 
				-    Syntax                               Description
			
 
				+    Hwreg Value Syntax                   Description
			
 
				     ==================================== ============================================================================
			
 
				     hwreg({0..63})                       All bits of a register indicated by its *id*.
			
 
				     hwreg(<*name*>)                      All bits of a register indicated by its *name*.
			
@@ -33,7 +36,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				     hwreg(<*name*>, {0..31}, {1..32})    Register bits indicated by register *name*, first bit *offset* and *size*.
			
 
				     ==================================== ============================================================================
			
 
				 
			
 
				-Register *id*, *offset* and *size* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Defined register *names* include:
			
 
				 
			
@@ -62,7 +66,16 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_getreg_b32 s2, 0x6
			
 
				+    reg = 1
			
 
				+    offset = 2
			
 
				+    size = 4
			
 
				+    hwreg_enc = reg | (offset << 6) | ((size - 1) << 11)
			
 
				+
			
 
				+    s_getreg_b32 s2, 0x1881
			
 
				+    s_getreg_b32 s2, hwreg_enc                     // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(1, 2, 4)                // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(reg, offset, size)      // the same as above
			
 
				+
			
 
				     s_getreg_b32 s2, hwreg(15)
			
 
				     s_getreg_b32 s2, hwreg(51, 1, 31)
			
 
				     s_getreg_b32 s2, hwreg(HW_REG_LDS_ALLOC, 0, 1)
			
--- a/docs/AMDGPU/gfx10_label.rst
+++ b/docs/AMDGPU/gfx10_label.rst
@@ -12,19 +12,26 @@ label
 
				 
			
 
				 A branch target which is a 16-bit signed integer treated as a PC-relative dword offset.
			
 
				 
			
 
				-This operand may be specified as:
			
 
				+This operand may be specified as one of the following:
			
 
				 
			
 
				-* An :ref:`integer_number<amdgpu_synid_integer_number>`. The number is truncated to 16 bits.
			
 
				-* An :ref:`absolute_expression<amdgpu_synid_absolute_expression>` which must start with an :ref:`integer_number<amdgpu_synid_integer_number>`. The value of the expression is truncated to 16 bits.
			
 
				-* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label). The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				+* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label) representing a relocatable address in the same compilation unit where it is referred from. The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				   offset = 30
			
 
				-  s_branch loop_end
			
 
				-  s_branch 2 + offset
			
 
				+  label_1:
			
 
				+  label_2 = . + 4
			
 
				+
			
 
				   s_branch 32
			
 
				-  loop_end:
			
 
				+  s_branch offset + 2
			
 
				+  s_branch label_1
			
 
				+  s_branch label_2
			
 
				+  s_branch label_3
			
 
				+  s_branch label_4
			
 
				+
			
 
				+  label_3 = label_2 + 4
			
 
				+  label_4:
			
 
				 
			
--- a/docs/AMDGPU/gfx10_msg.rst
+++ b/docs/AMDGPU/gfx10_msg.rst
@@ -12,24 +12,29 @@ msg
 
				 
			
 
				 A 16-bit message code. The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          Message *type*.
			
 
				-    6:4          Optional *operation*.
			
 
				-    9:7          Optional *parameters*.
			
 
				-    15:10        Unused.
			
 
				-    ============ ======================================================
			
 
				-
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below:
			
 
				-
			
 
				-    ======================================== ========================================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== ========================================================================
			
 
				-    sendmsg(<*type*>)                        A message identified by its *type*.
			
 
				-    sendmsg(<*type*>, <*op*>)                A message identified by its *type* and *operation*.
			
 
				-    sendmsg(<*type*>, <*op*>, <*stream*>)    A message identified by its *type* and *operation* with a stream *id*.
			
 
				-    ======================================== ========================================================================
			
 
				+    ============ =============================== ===============
			
 
				+    Bits         Description                     Value Range
			
 
				+    ============ =============================== ===============
			
 
				+    3:0          Message *type*.                 0..15
			
 
				+    6:4          Optional *operation*.           0..7
			
 
				+    7:7          Unused.                         \-
			
 
				+    9:8          Optional *stream*.              0..3
			
 
				+    15:10        Unused.                         \-
			
 
				+    ============ =============================== ===============
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A *sendmsg* value described below.
			
 
				+
			
 
				+    ==================================== ====================================================
			
 
				+    Sendmsg Value Syntax                 Description
			
 
				+    ==================================== ====================================================
			
 
				+    sendmsg(<*type*>)                    A message identified by its *type*.
			
 
				+    sendmsg(<*type*>,<*op*>)             A message identified by its *type* and *operation*.
			
 
				+    sendmsg(<*type*>,<*op*>,<*stream*>)  A message identified by its *type* and *operation*
			
 
				+                                         with a stream *id*.
			
 
				+    ==================================== ====================================================
			
 
				 
			
 
				 *Type* may be specified using message *name* or message *id*.
			
 
				 
			
@@ -37,7 +42,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				 
			
 
				 Stream *id* is an integer in the range 0..3.
			
 
				 
			
 
				-Message *id*, operation *id* and stream *id* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Each message type supports specific operations:
			
 
				 
			
@@ -60,16 +66,32 @@ Each message type supports specific operations:
 
				     \                            SYSMSG_OP_TTRACE_PC            4            \-
			
 
				     ================= ========== ============================== ============ ==========
			
 
				 
			
 
				+*Sendmsg* arguments are validated depending on how *type* value is specified:
			
 
				+
			
 
				+* If message *type* is specified by name, arguments values must satisfy limitations detailed in the table above.
			
 
				+* If message *type* is specified as a number, each argument must not exceed corresponding value range (see the first table).
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				+    // numeric message code
			
 
				+    msg = 0x10
			
 
				     s_sendmsg 0x12
			
 
				+    s_sendmsg msg + 2
			
 
				+
			
 
				+    // sendmsg with strict arguments validation
			
 
				     s_sendmsg sendmsg(MSG_INTERRUPT)
			
 
				-    s_sendmsg sendmsg(MSG_GET_DOORBELL)
			
 
				-    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				     s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT)
			
 
				     s_sendmsg sendmsg(MSG_GS, 2)
			
 
				     s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_EMIT_CUT, 1)
			
 
				     s_sendmsg sendmsg(MSG_SYSMSG, SYSMSG_OP_TTRACE_PC)
			
 
				+    s_sendmsg sendmsg(MSG_GET_DOORBELL)
			
 
				+
			
 
				+    // sendmsg with validation of value range only
			
 
				+    msg = 2
			
 
				+    op = 3
			
 
				+    stream = 1
			
 
				+    s_sendmsg sendmsg(msg, op, stream)
			
 
				+    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				 
			
--- a/docs/AMDGPU/gfx10_perm_smem.rst
+++ b/docs/AMDGPU/gfx10_perm_smem.rst
@@ -12,7 +12,8 @@ imm3
 
				 
			
 
				 A bit mask which indicates request permissions.
			
 
				 
			
 
				-This operand must be specified as an :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 7 bits, but only 3 low bits are significant.
			
 
				+This operand must be specified as an :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is truncated to 7 bits, but only 3 low bits are significant.
			
 
				 
			
 
				     ============ ==============================
			
 
				     Bit Number   Description
			
--- a/docs/AMDGPU/gfx10_simm16.rst
+++ b/docs/AMDGPU/gfx10_simm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then sign-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx10_uimm16.rst
+++ b/docs/AMDGPU/gfx10_uimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then zero-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx10_waitcnt.rst
+++ b/docs/AMDGPU/gfx10_waitcnt.rst
@@ -14,30 +14,31 @@ Counts of outstanding instructions to wait for.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          VM_CNT: vector memory operations count, lower bits.
			
 
				-    6:4          EXP_CNT: export count.
			
 
				-    11:8         LGKM_CNT: LDS, GDS, Constant and Message count.
			
 
				-    15:14        VM_CNT: vector memory operations count, upper bits.
			
 
				-    ============ ======================================================
			
 
				-
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>`
			
 
				-or as a combination of the following symbolic helpers:
			
 
				+    ========== ========= ================================================ ============
			
 
				+    High Bits  Low Bits  Description                                      Value Range
			
 
				+    ========== ========= ================================================ ============
			
 
				+    15:14      3:0       VM_CNT: vector memory operations count.          0..63
			
 
				+    \-         6:4       EXP_CNT: export count.                           0..7
			
 
				+    \-         11:8      LGKM_CNT: LDS, GDS, Constant and Message count.  0..15
			
 
				+    ========== ========= ================================================ ============
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A combination of *vmcnt*, *expcnt*, *lgkmcnt* and other values described below.
			
 
				 
			
 
				     ====================== ======================================================================
			
 
				     Syntax                 Description
			
 
				     ====================== ======================================================================
			
 
				-    vmcnt(<*N*>)           VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				-    expcnt(<*N*>)          EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				-    lgkmcnt(<*N*>)         LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				-    vmcnt_sat(<*N*>)       VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				-    expcnt_sat(<*N*>)      EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				-    lgkmcnt_sat(<*N*>)     LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				+    vmcnt(<*N*>)           A VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				+    expcnt(<*N*>)          An EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				+    lgkmcnt(<*N*>)         An LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				+    vmcnt_sat(<*N*>)       A VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				+    expcnt_sat(<*N*>)      An EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				+    lgkmcnt_sat(<*N*>)     An LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				     ====================== ======================================================================
			
 
				 
			
 
				-These helpers may be specified in any order. Ampersands and commas may be used as optional separators.
			
 
				+These values may be specified in any order. Spaces, ampersands and commas may be used as optional separators.
			
 
				 
			
 
				 *N* is either an
			
 
				 :ref:`integer number<amdgpu_synid_integer_number>` or an
			
@@ -47,10 +48,18 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_waitcnt 0
			
 
				+    vm_cnt = 1
			
 
				+    exp_cnt = 2
			
 
				+    lgkm_cnt = 3
			
 
				+    cnt = vm_cnt | (exp_cnt << 4) | (lgkm_cnt << 8)
			
 
				+
			
 
				+    s_waitcnt cnt
			
 
				+    s_waitcnt 1 | (2 << 4) | (3 << 8)                          // the same as above
			
 
				+    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)                    // the same as above
			
 
				+    s_waitcnt vmcnt(vm_cnt) expcnt(exp_cnt) lgkmcnt(lgkm_cnt)  // the same as above
			
 
				+
			
 
				     s_waitcnt vmcnt(1)
			
 
				     s_waitcnt expcnt(2) lgkmcnt(3)
			
 
				-    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1), expcnt(2), lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1) & lgkmcnt_sat(100) & expcnt(2)
			
 
				 
			
--- a/docs/AMDGPU/gfx7_bimm16.rst
+++ b/docs/AMDGPU/gfx7_bimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits.
			
 
				+A 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx7_bimm32.rst
+++ b/docs/AMDGPU/gfx7_bimm32.rst
@@ -10,5 +10,5 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value is truncated to 32 bits.
			
 
				 
			
--- a/docs/AMDGPU/gfx7_data_mimg_atomic_cmp.rst
+++ b/docs/AMDGPU/gfx7_data_mimg_atomic_cmp.rst
@@ -21,7 +21,7 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 2 data elements for 32-bit-per-pixel surfaces or 4 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx7_data_mimg_atomic_reg.rst
+++ b/docs/AMDGPU/gfx7_data_mimg_atomic_reg.rst
@@ -21,6 +21,6 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 1 data element for 32-bit-per-pixel surfaces or 2 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx7_fimm32.rst
+++ b/docs/AMDGPU/gfx7_fimm32.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The value is converted to *f32* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f32* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx7_hwreg.rst
+++ b/docs/AMDGPU/gfx7_hwreg.rst
@@ -14,18 +14,21 @@ Bits of a hardware register being accessed.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ===================================
			
 
				-    Bits         Description
			
 
				-    ============ ===================================
			
 
				-    5:0          Register *id*.
			
 
				-    10:6         First bit *offset* (0..31).
			
 
				-    15:11        *Size* in bits (1..32).
			
 
				-    ============ ===================================
			
 
				+    ======= ===================== ============
			
 
				+    Bits    Description           Value Range
			
 
				+    ======= ===================== ============
			
 
				+    5:0     Register *id*.        0..63
			
 
				+    10:6    First bit *offset*.   0..31
			
 
				+    15:11   *Size* in bits.       1..32
			
 
				+    ======= ===================== ============
			
 
				 
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below.
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* An *hwreg* value described below.
			
 
				 
			
 
				     ==================================== ============================================================================
			
 
				-    Syntax                               Description
			
 
				+    Hwreg Value Syntax                   Description
			
 
				     ==================================== ============================================================================
			
 
				     hwreg({0..63})                       All bits of a register indicated by its *id*.
			
 
				     hwreg(<*name*>)                      All bits of a register indicated by its *name*.
			
@@ -33,7 +36,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				     hwreg(<*name*>, {0..31}, {1..32})    Register bits indicated by register *name*, first bit *offset* and *size*.
			
 
				     ==================================== ============================================================================
			
 
				 
			
 
				-Register *id*, *offset* and *size* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Defined register *names* include:
			
 
				 
			
@@ -53,7 +57,16 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_getreg_b32 s2, 0x6
			
 
				+    reg = 1
			
 
				+    offset = 2
			
 
				+    size = 4
			
 
				+    hwreg_enc = reg | (offset << 6) | ((size - 1) << 11)
			
 
				+
			
 
				+    s_getreg_b32 s2, 0x1881
			
 
				+    s_getreg_b32 s2, hwreg_enc                     // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(1, 2, 4)                // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(reg, offset, size)      // the same as above
			
 
				+
			
 
				     s_getreg_b32 s2, hwreg(15)
			
 
				     s_getreg_b32 s2, hwreg(51, 1, 31)
			
 
				     s_getreg_b32 s2, hwreg(HW_REG_LDS_ALLOC, 0, 1)
			
--- a/docs/AMDGPU/gfx7_label.rst
+++ b/docs/AMDGPU/gfx7_label.rst
@@ -12,19 +12,26 @@ label
 
				 
			
 
				 A branch target which is a 16-bit signed integer treated as a PC-relative dword offset.
			
 
				 
			
 
				-This operand may be specified as:
			
 
				+This operand may be specified as one of the following:
			
 
				 
			
 
				-* An :ref:`integer_number<amdgpu_synid_integer_number>`. The number is truncated to 16 bits.
			
 
				-* An :ref:`absolute_expression<amdgpu_synid_absolute_expression>` which must start with an :ref:`integer_number<amdgpu_synid_integer_number>`. The value of the expression is truncated to 16 bits.
			
 
				-* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label). The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				+* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label) representing a relocatable address in the same compilation unit where it is referred from. The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				   offset = 30
			
 
				-  s_branch loop_end
			
 
				-  s_branch 2 + offset
			
 
				+  label_1:
			
 
				+  label_2 = . + 4
			
 
				+
			
 
				   s_branch 32
			
 
				-  loop_end:
			
 
				+  s_branch offset + 2
			
 
				+  s_branch label_1
			
 
				+  s_branch label_2
			
 
				+  s_branch label_3
			
 
				+  s_branch label_4
			
 
				+
			
 
				+  label_3 = label_2 + 4
			
 
				+  label_4:
			
 
				 
			
--- a/docs/AMDGPU/gfx7_msg.rst
+++ b/docs/AMDGPU/gfx7_msg.rst
@@ -12,24 +12,29 @@ msg
 
				 
			
 
				 A 16-bit message code. The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          Message *type*.
			
 
				-    6:4          Optional *operation*.
			
 
				-    9:7          Optional *parameters*.
			
 
				-    15:10        Unused.
			
 
				-    ============ ======================================================
			
 
				-
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below:
			
 
				-
			
 
				-    ======================================== ========================================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== ========================================================================
			
 
				-    sendmsg(<*type*>)                        A message identified by its *type*.
			
 
				-    sendmsg(<*type*>, <*op*>)                A message identified by its *type* and *operation*.
			
 
				-    sendmsg(<*type*>, <*op*>, <*stream*>)    A message identified by its *type* and *operation* with a stream *id*.
			
 
				-    ======================================== ========================================================================
			
 
				+    ============ =============================== ===============
			
 
				+    Bits         Description                     Value Range
			
 
				+    ============ =============================== ===============
			
 
				+    3:0          Message *type*.                 0..15
			
 
				+    6:4          Optional *operation*.           0..7
			
 
				+    7:7          Unused.                         \-
			
 
				+    9:8          Optional *stream*.              0..3
			
 
				+    15:10        Unused.                         \-
			
 
				+    ============ =============================== ===============
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A *sendmsg* value described below.
			
 
				+
			
 
				+    ==================================== ====================================================
			
 
				+    Sendmsg Value Syntax                 Description
			
 
				+    ==================================== ====================================================
			
 
				+    sendmsg(<*type*>)                    A message identified by its *type*.
			
 
				+    sendmsg(<*type*>,<*op*>)             A message identified by its *type* and *operation*.
			
 
				+    sendmsg(<*type*>,<*op*>,<*stream*>)  A message identified by its *type* and *operation*
			
 
				+                                         with a stream *id*.
			
 
				+    ==================================== ====================================================
			
 
				 
			
 
				 *Type* may be specified using message *name* or message *id*.
			
 
				 
			
@@ -37,7 +42,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				 
			
 
				 Stream *id* is an integer in the range 0..3.
			
 
				 
			
 
				-Message *id*, operation *id* and stream *id* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Each message type supports specific operations:
			
 
				 
			
@@ -58,15 +64,31 @@ Each message type supports specific operations:
 
				     \                            SYSMSG_OP_TTRACE_PC            4            \-
			
 
				     ================= ========== ============================== ============ ==========
			
 
				 
			
 
				+*Sendmsg* arguments are validated depending on how *type* value is specified:
			
 
				+
			
 
				+* If message *type* is specified by name, arguments values must satisfy limitations detailed in the table above.
			
 
				+* If message *type* is specified as a number, each argument must not exceed corresponding value range (see the first table).
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				+    // numeric message code
			
 
				+    msg = 0x10
			
 
				     s_sendmsg 0x12
			
 
				+    s_sendmsg msg + 2
			
 
				+
			
 
				+    // sendmsg with strict arguments validation
			
 
				     s_sendmsg sendmsg(MSG_INTERRUPT)
			
 
				-    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				     s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT)
			
 
				     s_sendmsg sendmsg(MSG_GS, 2)
			
 
				     s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_EMIT_CUT, 1)
			
 
				     s_sendmsg sendmsg(MSG_SYSMSG, SYSMSG_OP_TTRACE_PC)
			
 
				 
			
 
				+    // sendmsg with validation of value range only
			
 
				+    msg = 2
			
 
				+    op = 3
			
 
				+    stream = 1
			
 
				+    s_sendmsg sendmsg(msg, op, stream)
			
 
				+    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				+
			
--- a/docs/AMDGPU/gfx7_simm16.rst
+++ b/docs/AMDGPU/gfx7_simm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then sign-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx7_uimm16.rst
+++ b/docs/AMDGPU/gfx7_uimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then zero-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx7_waitcnt.rst
+++ b/docs/AMDGPU/gfx7_waitcnt.rst
@@ -14,29 +14,31 @@ Counts of outstanding instructions to wait for.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          VM_CNT: vector memory operations count.
			
 
				-    6:4          EXP_CNT: export count.
			
 
				-    12:8         LGKM_CNT: LDS, GDS, Constant and Message count.
			
 
				-    ============ ======================================================
			
 
				+   ===== ================================================ ============
			
 
				+   Bits  Description                                      Value Range
			
 
				+   ===== ================================================ ============
			
 
				+   3:0   VM_CNT: vector memory operations count.          0..15
			
 
				+   6:4   EXP_CNT: export count.                           0..7
			
 
				+   12:8  LGKM_CNT: LDS, GDS, Constant and Message count.  0..31
			
 
				+   ===== ================================================ ============
			
 
				 
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>`
			
 
				-or as a combination of the following symbolic helpers:
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A combination of *vmcnt*, *expcnt*, *lgkmcnt* and other values described below.
			
 
				 
			
 
				     ====================== ======================================================================
			
 
				     Syntax                 Description
			
 
				     ====================== ======================================================================
			
 
				-    vmcnt(<*N*>)           VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				-    expcnt(<*N*>)          EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				-    lgkmcnt(<*N*>)         LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				-    vmcnt_sat(<*N*>)       VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				-    expcnt_sat(<*N*>)      EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				-    lgkmcnt_sat(<*N*>)     LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				+    vmcnt(<*N*>)           A VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				+    expcnt(<*N*>)          An EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				+    lgkmcnt(<*N*>)         An LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				+    vmcnt_sat(<*N*>)       A VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				+    expcnt_sat(<*N*>)      An EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				+    lgkmcnt_sat(<*N*>)     An LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				     ====================== ======================================================================
			
 
				 
			
 
				-These helpers may be specified in any order. Ampersands and commas may be used as optional separators.
			
 
				+These values may be specified in any order. Spaces, ampersands and commas may be used as optional separators.
			
 
				 
			
 
				 *N* is either an
			
 
				 :ref:`integer number<amdgpu_synid_integer_number>` or an
			
@@ -46,10 +48,18 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_waitcnt 0
			
 
				+    vm_cnt = 1
			
 
				+    exp_cnt = 2
			
 
				+    lgkm_cnt = 3
			
 
				+    cnt = vm_cnt | (exp_cnt << 4) | (lgkm_cnt << 8)
			
 
				+
			
 
				+    s_waitcnt cnt
			
 
				+    s_waitcnt 1 | (2 << 4) | (3 << 8)                          // the same as above
			
 
				+    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)                    // the same as above
			
 
				+    s_waitcnt vmcnt(vm_cnt) expcnt(exp_cnt) lgkmcnt(lgkm_cnt)  // the same as above
			
 
				+
			
 
				     s_waitcnt vmcnt(1)
			
 
				     s_waitcnt expcnt(2) lgkmcnt(3)
			
 
				-    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1), expcnt(2), lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1) & lgkmcnt_sat(100) & expcnt(2)
			
 
				 
			
--- a/docs/AMDGPU/gfx8_bimm16.rst
+++ b/docs/AMDGPU/gfx8_bimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits.
			
 
				+A 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx8_bimm32.rst
+++ b/docs/AMDGPU/gfx8_bimm32.rst
@@ -10,5 +10,5 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value is truncated to 32 bits.
			
 
				 
			
--- a/docs/AMDGPU/gfx8_data_mimg_atomic_cmp.rst
+++ b/docs/AMDGPU/gfx8_data_mimg_atomic_cmp.rst
@@ -21,7 +21,7 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 2 data elements for 32-bit-per-pixel surfaces or 4 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx8_data_mimg_atomic_reg.rst
+++ b/docs/AMDGPU/gfx8_data_mimg_atomic_reg.rst
@@ -21,6 +21,6 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 1 data element for 32-bit-per-pixel surfaces or 2 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx8_fimm16.rst
+++ b/docs/AMDGPU/gfx8_fimm16.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The number is converted to *f16* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f16* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx8_fimm32.rst
+++ b/docs/AMDGPU/gfx8_fimm32.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The value is converted to *f32* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f32* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx8_hwreg.rst
+++ b/docs/AMDGPU/gfx8_hwreg.rst
@@ -14,18 +14,21 @@ Bits of a hardware register being accessed.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ===================================
			
 
				-    Bits         Description
			
 
				-    ============ ===================================
			
 
				-    5:0          Register *id*.
			
 
				-    10:6         First bit *offset* (0..31).
			
 
				-    15:11        *Size* in bits (1..32).
			
 
				-    ============ ===================================
			
 
				+    ======= ===================== ============
			
 
				+    Bits    Description           Value Range
			
 
				+    ======= ===================== ============
			
 
				+    5:0     Register *id*.        0..63
			
 
				+    10:6    First bit *offset*.   0..31
			
 
				+    15:11   *Size* in bits.       1..32
			
 
				+    ======= ===================== ============
			
 
				 
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below.
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* An *hwreg* value described below.
			
 
				 
			
 
				     ==================================== ============================================================================
			
 
				-    Syntax                               Description
			
 
				+    Hwreg Value Syntax                   Description
			
 
				     ==================================== ============================================================================
			
 
				     hwreg({0..63})                       All bits of a register indicated by its *id*.
			
 
				     hwreg(<*name*>)                      All bits of a register indicated by its *name*.
			
@@ -33,7 +36,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				     hwreg(<*name*>, {0..31}, {1..32})    Register bits indicated by register *name*, first bit *offset* and *size*.
			
 
				     ==================================== ============================================================================
			
 
				 
			
 
				-Register *id*, *offset* and *size* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Defined register *names* include:
			
 
				 
			
@@ -53,7 +57,16 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_getreg_b32 s2, 0x6
			
 
				+    reg = 1
			
 
				+    offset = 2
			
 
				+    size = 4
			
 
				+    hwreg_enc = reg | (offset << 6) | ((size - 1) << 11)
			
 
				+
			
 
				+    s_getreg_b32 s2, 0x1881
			
 
				+    s_getreg_b32 s2, hwreg_enc                     // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(1, 2, 4)                // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(reg, offset, size)      // the same as above
			
 
				+
			
 
				     s_getreg_b32 s2, hwreg(15)
			
 
				     s_getreg_b32 s2, hwreg(51, 1, 31)
			
 
				     s_getreg_b32 s2, hwreg(HW_REG_LDS_ALLOC, 0, 1)
			
--- a/docs/AMDGPU/gfx8_imask.rst
+++ b/docs/AMDGPU/gfx8_imask.rst
@@ -0,0 +1,66 @@
 
				+..
			
 
				+    **************************************************
			
 
				+    *                                                *
			
 
				+    *   Automatically generated file, do not edit!   *
			
 
				+    *                                                *
			
 
				+    **************************************************
			
 
				+
			
 
				+.. _amdgpu_synid8_imask:
			
 
				+
			
 
				+imask
			
 
				+===========================
			
 
				+
			
 
				+This operand is a mask which controls indexing mode for operands of subsequent instructions.
			
 
				+Bits 0, 1 and 2 control indexing of *src0*, *src1* and *src2*, while bit 3 controls indexing of *dst*.
			
 
				+Value 1 enables indexing and value 0 disables it.
			
 
				+
			
 
				+    ===== ========================================
			
 
				+    Bit   Meaning
			
 
				+    ===== ========================================
			
 
				+    0     Enables or disables *src0* indexing.
			
 
				+    1     Enables or disables *src1* indexing.
			
 
				+    2     Enables or disables *src2* indexing.
			
 
				+    3     Enables or disables *dst* indexing.
			
 
				+    ===== ========================================
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..15.
			
 
				+* A *gpr_idx* value described below.
			
 
				+
			
 
				+    ==================================== ===========================================
			
 
				+    Gpr_idx Value Syntax                 Description
			
 
				+    ==================================== ===========================================
			
 
				+    gpr_idx(*<operands>*)                Enable indexing for specified *operands*
			
 
				+                                         and disable it for the rest.
			
 
				+                                         *Operands* is a comma-separated list of
			
 
				+                                         values which may include:
			
 
				+
			
 
				+                                         * "SRC0" - enable *src0* indexing.
			
 
				+
			
 
				+                                         * "SRC1" - enable *src1* indexing.
			
 
				+
			
 
				+                                         * "SRC2" - enable *src2* indexing.
			
 
				+
			
 
				+                                         * "DST"  - enable *dst* indexing.
			
 
				+
			
 
				+                                         Each of these values may be specified only
			
 
				+                                         once.
			
 
				+
			
 
				+                                         *Operands* list may be empty; this syntax
			
 
				+                                         disables indexing for all operands.
			
 
				+    ==================================== ===========================================
			
 
				+
			
 
				+Examples:
			
 
				+
			
 
				+.. parsed-literal::
			
 
				+
			
 
				+    s_set_gpr_idx_mode 0
			
 
				+    s_set_gpr_idx_mode gpr_idx()                        // the same as above
			
 
				+
			
 
				+    s_set_gpr_idx_mode 15
			
 
				+    s_set_gpr_idx_mode gpr_idx(DST,SRC0,SRC1,SRC2)      // the same as above
			
 
				+    s_set_gpr_idx_mode gpr_idx(SRC0,SRC1,SRC2,DST)      // the same as above
			
 
				+
			
 
				+    s_set_gpr_idx_mode gpr_idx(DST,SRC1)
			
 
				+
			
--- a/docs/AMDGPU/gfx8_imm4.rst
+++ b/docs/AMDGPU/gfx8_imm4.rst
@@ -1,25 +0,0 @@
 
				-..
			
 
				-    **************************************************
			
 
				-    *                                                *
			
 
				-    *   Automatically generated file, do not edit!   *
			
 
				-    *                                                *
			
 
				-    **************************************************
			
 
				-
			
 
				-.. _amdgpu_synid8_imm4:
			
 
				-
			
 
				-imm4
			
 
				-===========================
			
 
				-
			
 
				-A positive :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 4 bits.
			
 
				-
			
 
				-This operand is a mask which controls indexing mode for operands of subsequent instructions. Value 1 enables indexing and value 0 disables it.
			
 
				-
			
 
				-    ============ ========================================
			
 
				-    Bit          Meaning
			
 
				-    ============ ========================================
			
 
				-    0            Enables or disables *src0* indexing.
			
 
				-    1            Enables or disables *src1* indexing.
			
 
				-    2            Enables or disables *src2* indexing.
			
 
				-    3            Enables or disables *dst* indexing.
			
 
				-    ============ ========================================
			
 
				-
			
--- a/docs/AMDGPU/gfx8_label.rst
+++ b/docs/AMDGPU/gfx8_label.rst
@@ -12,19 +12,26 @@ label
 
				 
			
 
				 A branch target which is a 16-bit signed integer treated as a PC-relative dword offset.
			
 
				 
			
 
				-This operand may be specified as:
			
 
				+This operand may be specified as one of the following:
			
 
				 
			
 
				-* An :ref:`integer_number<amdgpu_synid_integer_number>`. The number is truncated to 16 bits.
			
 
				-* An :ref:`absolute_expression<amdgpu_synid_absolute_expression>` which must start with an :ref:`integer_number<amdgpu_synid_integer_number>`. The value of the expression is truncated to 16 bits.
			
 
				-* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label). The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				+* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label) representing a relocatable address in the same compilation unit where it is referred from. The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				   offset = 30
			
 
				-  s_branch loop_end
			
 
				-  s_branch 2 + offset
			
 
				+  label_1:
			
 
				+  label_2 = . + 4
			
 
				+
			
 
				   s_branch 32
			
 
				-  loop_end:
			
 
				+  s_branch offset + 2
			
 
				+  s_branch label_1
			
 
				+  s_branch label_2
			
 
				+  s_branch label_3
			
 
				+  s_branch label_4
			
 
				+
			
 
				+  label_3 = label_2 + 4
			
 
				+  label_4:
			
 
				 
			
--- a/docs/AMDGPU/gfx8_msg.rst
+++ b/docs/AMDGPU/gfx8_msg.rst
@@ -12,24 +12,29 @@ msg
 
				 
			
 
				 A 16-bit message code. The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          Message *type*.
			
 
				-    6:4          Optional *operation*.
			
 
				-    9:7          Optional *parameters*.
			
 
				-    15:10        Unused.
			
 
				-    ============ ======================================================
			
 
				-
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below:
			
 
				-
			
 
				-    ======================================== ========================================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== ========================================================================
			
 
				-    sendmsg(<*type*>)                        A message identified by its *type*.
			
 
				-    sendmsg(<*type*>, <*op*>)                A message identified by its *type* and *operation*.
			
 
				-    sendmsg(<*type*>, <*op*>, <*stream*>)    A message identified by its *type* and *operation* with a stream *id*.
			
 
				-    ======================================== ========================================================================
			
 
				+    ============ =============================== ===============
			
 
				+    Bits         Description                     Value Range
			
 
				+    ============ =============================== ===============
			
 
				+    3:0          Message *type*.                 0..15
			
 
				+    6:4          Optional *operation*.           0..7
			
 
				+    7:7          Unused.                         \-
			
 
				+    9:8          Optional *stream*.              0..3
			
 
				+    15:10        Unused.                         \-
			
 
				+    ============ =============================== ===============
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A *sendmsg* value described below.
			
 
				+
			
 
				+    ==================================== ====================================================
			
 
				+    Sendmsg Value Syntax                 Description
			
 
				+    ==================================== ====================================================
			
 
				+    sendmsg(<*type*>)                    A message identified by its *type*.
			
 
				+    sendmsg(<*type*>,<*op*>)             A message identified by its *type* and *operation*.
			
 
				+    sendmsg(<*type*>,<*op*>,<*stream*>)  A message identified by its *type* and *operation*
			
 
				+                                         with a stream *id*.
			
 
				+    ==================================== ====================================================
			
 
				 
			
 
				 *Type* may be specified using message *name* or message *id*.
			
 
				 
			
@@ -37,7 +42,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				 
			
 
				 Stream *id* is an integer in the range 0..3.
			
 
				 
			
 
				-Message *id*, operation *id* and stream *id* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Each message type supports specific operations:
			
 
				 
			
@@ -58,15 +64,31 @@ Each message type supports specific operations:
 
				     \                            SYSMSG_OP_TTRACE_PC            4            \-
			
 
				     ================= ========== ============================== ============ ==========
			
 
				 
			
 
				+*Sendmsg* arguments are validated depending on how *type* value is specified:
			
 
				+
			
 
				+* If message *type* is specified by name, arguments values must satisfy limitations detailed in the table above.
			
 
				+* If message *type* is specified as a number, each argument must not exceed corresponding value range (see the first table).
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				+    // numeric message code
			
 
				+    msg = 0x10
			
 
				     s_sendmsg 0x12
			
 
				+    s_sendmsg msg + 2
			
 
				+
			
 
				+    // sendmsg with strict arguments validation
			
 
				     s_sendmsg sendmsg(MSG_INTERRUPT)
			
 
				-    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				     s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT)
			
 
				     s_sendmsg sendmsg(MSG_GS, 2)
			
 
				     s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_EMIT_CUT, 1)
			
 
				     s_sendmsg sendmsg(MSG_SYSMSG, SYSMSG_OP_TTRACE_PC)
			
 
				 
			
 
				+    // sendmsg with validation of value range only
			
 
				+    msg = 2
			
 
				+    op = 3
			
 
				+    stream = 1
			
 
				+    s_sendmsg sendmsg(msg, op, stream)
			
 
				+    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				+
			
--- a/docs/AMDGPU/gfx8_perm_smem.rst
+++ b/docs/AMDGPU/gfx8_perm_smem.rst
@@ -12,7 +12,8 @@ imm3
 
				 
			
 
				 A bit mask which indicates request permissions.
			
 
				 
			
 
				-This operand must be specified as an :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 7 bits, but only 3 low bits are significant.
			
 
				+This operand must be specified as an :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is truncated to 7 bits, but only 3 low bits are significant.
			
 
				 
			
 
				     ============ ==============================
			
 
				     Bit Number   Description
			
--- a/docs/AMDGPU/gfx8_simm16.rst
+++ b/docs/AMDGPU/gfx8_simm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then sign-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx8_uimm16.rst
+++ b/docs/AMDGPU/gfx8_uimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then zero-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx8_waitcnt.rst
+++ b/docs/AMDGPU/gfx8_waitcnt.rst
@@ -14,29 +14,31 @@ Counts of outstanding instructions to wait for.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          VM_CNT: vector memory operations count.
			
 
				-    6:4          EXP_CNT: export count.
			
 
				-    11:8         LGKM_CNT: LDS, GDS, Constant and Message count.
			
 
				-    ============ ======================================================
			
 
				+   ===== ================================================ ============
			
 
				+   Bits  Description                                      Value Range
			
 
				+   ===== ================================================ ============
			
 
				+   3:0   VM_CNT: vector memory operations count.          0..15
			
 
				+   6:4   EXP_CNT: export count.                           0..7
			
 
				+   11:8  LGKM_CNT: LDS, GDS, Constant and Message count.  0..15
			
 
				+   ===== ================================================ ============
			
 
				 
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>`
			
 
				-or as a combination of the following symbolic helpers:
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A combination of *vmcnt*, *expcnt*, *lgkmcnt* and other values described below.
			
 
				 
			
 
				     ====================== ======================================================================
			
 
				     Syntax                 Description
			
 
				     ====================== ======================================================================
			
 
				-    vmcnt(<*N*>)           VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				-    expcnt(<*N*>)          EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				-    lgkmcnt(<*N*>)         LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				-    vmcnt_sat(<*N*>)       VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				-    expcnt_sat(<*N*>)      EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				-    lgkmcnt_sat(<*N*>)     LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				+    vmcnt(<*N*>)           A VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				+    expcnt(<*N*>)          An EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				+    lgkmcnt(<*N*>)         An LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				+    vmcnt_sat(<*N*>)       A VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				+    expcnt_sat(<*N*>)      An EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				+    lgkmcnt_sat(<*N*>)     An LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				     ====================== ======================================================================
			
 
				 
			
 
				-These helpers may be specified in any order. Ampersands and commas may be used as optional separators.
			
 
				+These values may be specified in any order. Spaces, ampersands and commas may be used as optional separators.
			
 
				 
			
 
				 *N* is either an
			
 
				 :ref:`integer number<amdgpu_synid_integer_number>` or an
			
@@ -46,10 +48,18 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_waitcnt 0
			
 
				+    vm_cnt = 1
			
 
				+    exp_cnt = 2
			
 
				+    lgkm_cnt = 3
			
 
				+    cnt = vm_cnt | (exp_cnt << 4) | (lgkm_cnt << 8)
			
 
				+
			
 
				+    s_waitcnt cnt
			
 
				+    s_waitcnt 1 | (2 << 4) | (3 << 8)                          // the same as above
			
 
				+    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)                    // the same as above
			
 
				+    s_waitcnt vmcnt(vm_cnt) expcnt(exp_cnt) lgkmcnt(lgkm_cnt)  // the same as above
			
 
				+
			
 
				     s_waitcnt vmcnt(1)
			
 
				     s_waitcnt expcnt(2) lgkmcnt(3)
			
 
				-    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1), expcnt(2), lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1) & lgkmcnt_sat(100) & expcnt(2)
			
 
				 
			
--- a/docs/AMDGPU/gfx9_bimm16.rst
+++ b/docs/AMDGPU/gfx9_bimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits.
			
 
				+A 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx9_bimm32.rst
+++ b/docs/AMDGPU/gfx9_bimm32.rst
@@ -10,5 +10,5 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value is truncated to 32 bits.
			
 
				 
			
--- a/docs/AMDGPU/gfx9_data_mimg_atomic_cmp.rst
+++ b/docs/AMDGPU/gfx9_data_mimg_atomic_cmp.rst
@@ -21,7 +21,7 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 2 data elements for 32-bit-per-pixel surfaces or 4 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx9_data_mimg_atomic_reg.rst
+++ b/docs/AMDGPU/gfx9_data_mimg_atomic_reg.rst
@@ -21,6 +21,6 @@ Optionally may serve as an output data:
 
				 * :ref:`dmask<amdgpu_synid_dmask>` may specify 1 data element for 32-bit-per-pixel surfaces or 2 data elements for 64-bit-per-pixel surfaces. Each data element occupies 1 dword.
			
 
				 * :ref:`tfe<amdgpu_synid_tfe>` adds 1 dword if specified.
			
 
				 
			
 
				-  Note. The surface data format is indicated in the image resource constant but not in the instruction.
			
 
				+  Note: the surface data format is indicated in the image resource constant but not in the instruction.
			
 
				 
			
 
				 *Operands:* :ref:`v<amdgpu_synid_v>`
			
--- a/docs/AMDGPU/gfx9_fimm16.rst
+++ b/docs/AMDGPU/gfx9_fimm16.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The number is converted to *f16* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f16* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx9_fimm32.rst
+++ b/docs/AMDGPU/gfx9_fimm32.rst
@@ -10,5 +10,6 @@
 
				 imm32
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>` or a :ref:`floating-point_number<amdgpu_synid_floating-point_number>`. The value is converted to *f32* as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+A :ref:`floating-point_number<amdgpu_synid_floating-point_number>`, an :ref:`integer_number<amdgpu_synid_integer_number>`, or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is converted to *f32* as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
--- a/docs/AMDGPU/gfx9_hwreg.rst
+++ b/docs/AMDGPU/gfx9_hwreg.rst
@@ -14,18 +14,21 @@ Bits of a hardware register being accessed.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ===================================
			
 
				-    Bits         Description
			
 
				-    ============ ===================================
			
 
				-    5:0          Register *id*.
			
 
				-    10:6         First bit *offset* (0..31).
			
 
				-    15:11        *Size* in bits (1..32).
			
 
				-    ============ ===================================
			
 
				+    ======= ===================== ============
			
 
				+    Bits    Description           Value Range
			
 
				+    ======= ===================== ============
			
 
				+    5:0     Register *id*.        0..63
			
 
				+    10:6    First bit *offset*.   0..31
			
 
				+    15:11   *Size* in bits.       1..32
			
 
				+    ======= ===================== ============
			
 
				 
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below.
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* An *hwreg* value described below.
			
 
				 
			
 
				     ==================================== ============================================================================
			
 
				-    Syntax                               Description
			
 
				+    Hwreg Value Syntax                   Description
			
 
				     ==================================== ============================================================================
			
 
				     hwreg({0..63})                       All bits of a register indicated by its *id*.
			
 
				     hwreg(<*name*>)                      All bits of a register indicated by its *name*.
			
@@ -33,7 +36,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				     hwreg(<*name*>, {0..31}, {1..32})    Register bits indicated by register *name*, first bit *offset* and *size*.
			
 
				     ==================================== ============================================================================
			
 
				 
			
 
				-Register *id*, *offset* and *size* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Defined register *names* include:
			
 
				 
			
@@ -54,7 +58,16 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_getreg_b32 s2, 0x6
			
 
				+    reg = 1
			
 
				+    offset = 2
			
 
				+    size = 4
			
 
				+    hwreg_enc = reg | (offset << 6) | ((size - 1) << 11)
			
 
				+
			
 
				+    s_getreg_b32 s2, 0x1881
			
 
				+    s_getreg_b32 s2, hwreg_enc                     // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(1, 2, 4)                // the same as above
			
 
				+    s_getreg_b32 s2, hwreg(reg, offset, size)      // the same as above
			
 
				+
			
 
				     s_getreg_b32 s2, hwreg(15)
			
 
				     s_getreg_b32 s2, hwreg(51, 1, 31)
			
 
				     s_getreg_b32 s2, hwreg(HW_REG_LDS_ALLOC, 0, 1)
			
--- a/docs/AMDGPU/gfx9_imask.rst
+++ b/docs/AMDGPU/gfx9_imask.rst
@@ -0,0 +1,66 @@
 
				+..
			
 
				+    **************************************************
			
 
				+    *                                                *
			
 
				+    *   Automatically generated file, do not edit!   *
			
 
				+    *                                                *
			
 
				+    **************************************************
			
 
				+
			
 
				+.. _amdgpu_synid9_imask:
			
 
				+
			
 
				+imask
			
 
				+===========================
			
 
				+
			
 
				+This operand is a mask which controls indexing mode for operands of subsequent instructions.
			
 
				+Bits 0, 1 and 2 control indexing of *src0*, *src1* and *src2*, while bit 3 controls indexing of *dst*.
			
 
				+Value 1 enables indexing and value 0 disables it.
			
 
				+
			
 
				+    ===== ========================================
			
 
				+    Bit   Meaning
			
 
				+    ===== ========================================
			
 
				+    0     Enables or disables *src0* indexing.
			
 
				+    1     Enables or disables *src1* indexing.
			
 
				+    2     Enables or disables *src2* indexing.
			
 
				+    3     Enables or disables *dst* indexing.
			
 
				+    ===== ========================================
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..15.
			
 
				+* A *gpr_idx* value described below.
			
 
				+
			
 
				+    ==================================== ===========================================
			
 
				+    Gpr_idx Value Syntax                 Description
			
 
				+    ==================================== ===========================================
			
 
				+    gpr_idx(*<operands>*)                Enable indexing for specified *operands*
			
 
				+                                         and disable it for the rest.
			
 
				+                                         *Operands* is a comma-separated list of
			
 
				+                                         values which may include:
			
 
				+
			
 
				+                                         * "SRC0" - enable *src0* indexing.
			
 
				+
			
 
				+                                         * "SRC1" - enable *src1* indexing.
			
 
				+
			
 
				+                                         * "SRC2" - enable *src2* indexing.
			
 
				+
			
 
				+                                         * "DST"  - enable *dst* indexing.
			
 
				+
			
 
				+                                         Each of these values may be specified only
			
 
				+                                         once.
			
 
				+
			
 
				+                                         *Operands* list may be empty; this syntax
			
 
				+                                         disables indexing for all operands.
			
 
				+    ==================================== ===========================================
			
 
				+
			
 
				+Examples:
			
 
				+
			
 
				+.. parsed-literal::
			
 
				+
			
 
				+    s_set_gpr_idx_mode 0
			
 
				+    s_set_gpr_idx_mode gpr_idx()                        // the same as above
			
 
				+
			
 
				+    s_set_gpr_idx_mode 15
			
 
				+    s_set_gpr_idx_mode gpr_idx(DST,SRC0,SRC1,SRC2)      // the same as above
			
 
				+    s_set_gpr_idx_mode gpr_idx(SRC0,SRC1,SRC2,DST)      // the same as above
			
 
				+
			
 
				+    s_set_gpr_idx_mode gpr_idx(DST,SRC1)
			
 
				+
			
--- a/docs/AMDGPU/gfx9_imm4.rst
+++ b/docs/AMDGPU/gfx9_imm4.rst
@@ -1,25 +0,0 @@
 
				-..
			
 
				-    **************************************************
			
 
				-    *                                                *
			
 
				-    *   Automatically generated file, do not edit!   *
			
 
				-    *                                                *
			
 
				-    **************************************************
			
 
				-
			
 
				-.. _amdgpu_synid9_imm4:
			
 
				-
			
 
				-imm4
			
 
				-===========================
			
 
				-
			
 
				-A positive :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 4 bits.
			
 
				-
			
 
				-This operand is a mask which controls indexing mode for operands of subsequent instructions. Value 1 enables indexing and value 0 disables it.
			
 
				-
			
 
				-    ============ ========================================
			
 
				-    Bit          Meaning
			
 
				-    ============ ========================================
			
 
				-    0            Enables or disables *src0* indexing.
			
 
				-    1            Enables or disables *src1* indexing.
			
 
				-    2            Enables or disables *src2* indexing.
			
 
				-    3            Enables or disables *dst* indexing.
			
 
				-    ============ ========================================
			
 
				-
			
--- a/docs/AMDGPU/gfx9_label.rst
+++ b/docs/AMDGPU/gfx9_label.rst
@@ -12,19 +12,26 @@ label
 
				 
			
 
				 A branch target which is a 16-bit signed integer treated as a PC-relative dword offset.
			
 
				 
			
 
				-This operand may be specified as:
			
 
				+This operand may be specified as one of the following:
			
 
				 
			
 
				-* An :ref:`integer_number<amdgpu_synid_integer_number>`. The number is truncated to 16 bits.
			
 
				-* An :ref:`absolute_expression<amdgpu_synid_absolute_expression>` which must start with an :ref:`integer_number<amdgpu_synid_integer_number>`. The value of the expression is truncated to 16 bits.
			
 
				-* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label). The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				+* A :ref:`symbol<amdgpu_synid_symbol>` (for example, a label) representing a relocatable address in the same compilation unit where it is referred from. The value is handled as a 16-bit PC-relative dword offset to be resolved by a linker.
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				   offset = 30
			
 
				-  s_branch loop_end
			
 
				-  s_branch 2 + offset
			
 
				+  label_1:
			
 
				+  label_2 = . + 4
			
 
				+
			
 
				   s_branch 32
			
 
				-  loop_end:
			
 
				+  s_branch offset + 2
			
 
				+  s_branch label_1
			
 
				+  s_branch label_2
			
 
				+  s_branch label_3
			
 
				+  s_branch label_4
			
 
				+
			
 
				+  label_3 = label_2 + 4
			
 
				+  label_4:
			
 
				 
			
--- a/docs/AMDGPU/gfx9_msg.rst
+++ b/docs/AMDGPU/gfx9_msg.rst
@@ -12,24 +12,29 @@ msg
 
				 
			
 
				 A 16-bit message code. The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          Message *type*.
			
 
				-    6:4          Optional *operation*.
			
 
				-    9:7          Optional *parameters*.
			
 
				-    15:10        Unused.
			
 
				-    ============ ======================================================
			
 
				-
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>` or using the syntax described below:
			
 
				-
			
 
				-    ======================================== ========================================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== ========================================================================
			
 
				-    sendmsg(<*type*>)                        A message identified by its *type*.
			
 
				-    sendmsg(<*type*>, <*op*>)                A message identified by its *type* and *operation*.
			
 
				-    sendmsg(<*type*>, <*op*>, <*stream*>)    A message identified by its *type* and *operation* with a stream *id*.
			
 
				-    ======================================== ========================================================================
			
 
				+    ============ =============================== ===============
			
 
				+    Bits         Description                     Value Range
			
 
				+    ============ =============================== ===============
			
 
				+    3:0          Message *type*.                 0..15
			
 
				+    6:4          Optional *operation*.           0..7
			
 
				+    7:7          Unused.                         \-
			
 
				+    9:8          Optional *stream*.              0..3
			
 
				+    15:10        Unused.                         \-
			
 
				+    ============ =============================== ===============
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A *sendmsg* value described below.
			
 
				+
			
 
				+    ==================================== ====================================================
			
 
				+    Sendmsg Value Syntax                 Description
			
 
				+    ==================================== ====================================================
			
 
				+    sendmsg(<*type*>)                    A message identified by its *type*.
			
 
				+    sendmsg(<*type*>,<*op*>)             A message identified by its *type* and *operation*.
			
 
				+    sendmsg(<*type*>,<*op*>,<*stream*>)  A message identified by its *type* and *operation*
			
 
				+                                         with a stream *id*.
			
 
				+    ==================================== ====================================================
			
 
				 
			
 
				 *Type* may be specified using message *name* or message *id*.
			
 
				 
			
@@ -37,7 +42,8 @@ This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_s
 
				 
			
 
				 Stream *id* is an integer in the range 0..3.
			
 
				 
			
 
				-Message *id*, operation *id* and stream *id* must be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+Numeric values may be specified as positive :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Each message type supports specific operations:
			
 
				 
			
@@ -60,16 +66,32 @@ Each message type supports specific operations:
 
				     \                            SYSMSG_OP_TTRACE_PC            4            \-
			
 
				     ================= ========== ============================== ============ ==========
			
 
				 
			
 
				+*Sendmsg* arguments are validated depending on how *type* value is specified:
			
 
				+
			
 
				+* If message *type* is specified by name, arguments values must satisfy limitations detailed in the table above.
			
 
				+* If message *type* is specified as a number, each argument must not exceed corresponding value range (see the first table).
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				+    // numeric message code
			
 
				+    msg = 0x10
			
 
				     s_sendmsg 0x12
			
 
				+    s_sendmsg msg + 2
			
 
				+
			
 
				+    // sendmsg with strict arguments validation
			
 
				     s_sendmsg sendmsg(MSG_INTERRUPT)
			
 
				-    s_sendmsg sendmsg(MSG_GET_DOORBELL)
			
 
				-    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				     s_sendmsg sendmsg(MSG_GS, GS_OP_EMIT)
			
 
				     s_sendmsg sendmsg(MSG_GS, 2)
			
 
				     s_sendmsg sendmsg(MSG_GS_DONE, GS_OP_EMIT_CUT, 1)
			
 
				     s_sendmsg sendmsg(MSG_SYSMSG, SYSMSG_OP_TTRACE_PC)
			
 
				+    s_sendmsg sendmsg(MSG_GET_DOORBELL)
			
 
				+
			
 
				+    // sendmsg with validation of value range only
			
 
				+    msg = 2
			
 
				+    op = 3
			
 
				+    stream = 1
			
 
				+    s_sendmsg sendmsg(msg, op, stream)
			
 
				+    s_sendmsg sendmsg(2, GS_OP_CUT)
			
 
				 
			
--- a/docs/AMDGPU/gfx9_perm_smem.rst
+++ b/docs/AMDGPU/gfx9_perm_smem.rst
@@ -12,7 +12,8 @@ imm3
 
				 
			
 
				 A bit mask which indicates request permissions.
			
 
				 
			
 
				-This operand must be specified as an :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 7 bits, but only 3 low bits are significant.
			
 
				+This operand must be specified as an :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value is truncated to 7 bits, but only 3 low bits are significant.
			
 
				 
			
 
				     ============ ==============================
			
 
				     Bit Number   Description
			
--- a/docs/AMDGPU/gfx9_simm16.rst
+++ b/docs/AMDGPU/gfx9_simm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then sign-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range -32768..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx9_uimm16.rst
+++ b/docs/AMDGPU/gfx9_uimm16.rst
@@ -10,5 +10,5 @@
 
				 imm16
			
 
				 ===========================
			
 
				 
			
 
				-An :ref:`integer_number<amdgpu_synid_integer_number>`. The value is truncated to 16 bits and then zero-extended to 32 bits.
			
 
				+An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..65535.
			
 
				 
			
--- a/docs/AMDGPU/gfx9_waitcnt.rst
+++ b/docs/AMDGPU/gfx9_waitcnt.rst
@@ -14,30 +14,31 @@ Counts of outstanding instructions to wait for.
 
				 
			
 
				 The bits of this operand have the following meaning:
			
 
				 
			
 
				-    ============ ======================================================
			
 
				-    Bits         Description
			
 
				-    ============ ======================================================
			
 
				-    3:0          VM_CNT: vector memory operations count, lower bits.
			
 
				-    6:4          EXP_CNT: export count.
			
 
				-    11:8         LGKM_CNT: LDS, GDS, Constant and Message count.
			
 
				-    15:14        VM_CNT: vector memory operations count, upper bits.
			
 
				-    ============ ======================================================
			
 
				-
			
 
				-This operand may be specified as a positive 16-bit :ref:`integer_number<amdgpu_synid_integer_number>`
			
 
				-or as a combination of the following symbolic helpers:
			
 
				+    ========== ========= ================================================ ============
			
 
				+    High Bits  Low Bits  Description                                      Value Range
			
 
				+    ========== ========= ================================================ ============
			
 
				+    15:14      3:0       VM_CNT: vector memory operations count.          0..63
			
 
				+    \-         6:4       EXP_CNT: export count.                           0..7
			
 
				+    \-         11:8      LGKM_CNT: LDS, GDS, Constant and Message count.  0..15
			
 
				+    ========== ========= ================================================ ============
			
 
				+
			
 
				+This operand may be specified as one of the following:
			
 
				+
			
 
				+* An :ref:`integer_number<amdgpu_synid_integer_number>` or an :ref:`absolute_expression<amdgpu_synid_absolute_expression>`. The value must be in the range 0..0xFFFF.
			
 
				+* A combination of *vmcnt*, *expcnt*, *lgkmcnt* and other values described below.
			
 
				 
			
 
				     ====================== ======================================================================
			
 
				     Syntax                 Description
			
 
				     ====================== ======================================================================
			
 
				-    vmcnt(<*N*>)           VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				-    expcnt(<*N*>)          EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				-    lgkmcnt(<*N*>)         LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				-    vmcnt_sat(<*N*>)       VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				-    expcnt_sat(<*N*>)      EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				-    lgkmcnt_sat(<*N*>)     LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				+    vmcnt(<*N*>)           A VM_CNT value. *N* must not exceed the largest VM_CNT value.
			
 
				+    expcnt(<*N*>)          An EXP_CNT value. *N* must not exceed the largest EXP_CNT value.
			
 
				+    lgkmcnt(<*N*>)         An LGKM_CNT value. *N* must not exceed the largest LGKM_CNT value.
			
 
				+    vmcnt_sat(<*N*>)       A VM_CNT value computed as min(*N*, the largest VM_CNT value).
			
 
				+    expcnt_sat(<*N*>)      An EXP_CNT value computed as min(*N*, the largest EXP_CNT value).
			
 
				+    lgkmcnt_sat(<*N*>)     An LGKM_CNT value computed as min(*N*, the largest LGKM_CNT value).
			
 
				     ====================== ======================================================================
			
 
				 
			
 
				-These helpers may be specified in any order. Ampersands and commas may be used as optional separators.
			
 
				+These values may be specified in any order. Spaces, ampersands and commas may be used as optional separators.
			
 
				 
			
 
				 *N* is either an
			
 
				 :ref:`integer number<amdgpu_synid_integer_number>` or an
			
@@ -47,10 +48,18 @@ Examples:
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    s_waitcnt 0
			
 
				+    vm_cnt = 1
			
 
				+    exp_cnt = 2
			
 
				+    lgkm_cnt = 3
			
 
				+    cnt = vm_cnt | (exp_cnt << 4) | (lgkm_cnt << 8)
			
 
				+
			
 
				+    s_waitcnt cnt
			
 
				+    s_waitcnt 1 | (2 << 4) | (3 << 8)                          // the same as above
			
 
				+    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)                    // the same as above
			
 
				+    s_waitcnt vmcnt(vm_cnt) expcnt(exp_cnt) lgkmcnt(lgkm_cnt)  // the same as above
			
 
				+
			
 
				     s_waitcnt vmcnt(1)
			
 
				     s_waitcnt expcnt(2) lgkmcnt(3)
			
 
				-    s_waitcnt vmcnt(1) expcnt(2) lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1), expcnt(2), lgkmcnt(3)
			
 
				     s_waitcnt vmcnt(1) & lgkmcnt_sat(100) & expcnt(2)
			
 
				 
			
--- a/docs/AMDGPUModifierSyntax.rst
+++ b/docs/AMDGPUModifierSyntax.rst
@@ -34,19 +34,21 @@ Specifies an immediate unsigned 8-bit offset, in bytes. The default value is 0.
 
				 
			
 
				 Used with DS instructions which have 2 addresses.
			
 
				 
			
 
				-    =================== =====================================================
			
 
				+    =================== ====================================================================
			
 
				     Syntax              Description
			
 
				-    =================== =====================================================
			
 
				+    =================== ====================================================================
			
 
				     offset:{0..0xFF}    Specifies an unsigned 8-bit offset as a positive
			
 
				-                        :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    =================== =====================================================
			
 
				+                        :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                        or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    =================== ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-  offset:255
			
 
				   offset:0xff
			
 
				+  offset:2-x
			
 
				+  offset:-x-y
			
 
				 
			
 
				 .. _amdgpu_synid_ds_offset16:
			
 
				 
			
@@ -57,12 +59,13 @@ Specifies an immediate unsigned 16-bit offset, in bytes. The default value is 0.
 
				 
			
 
				 Used with DS instructions which have 1 address.
			
 
				 
			
 
				-    ==================== ======================================================
			
 
				+    ==================== ====================================================================
			
 
				     Syntax               Description
			
 
				-    ==================== ======================================================
			
 
				+    ==================== ====================================================================
			
 
				     offset:{0..0xFFFF}   Specifies an unsigned 16-bit offset as a positive
			
 
				-                         :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    ==================== ======================================================
			
 
				+                         :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                         or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    ==================== ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
@@ -70,6 +73,7 @@ Examples:
 
				 
			
 
				   offset:65535
			
 
				   offset:0xffff
			
 
				+  offset:-x-y
			
 
				 
			
 
				 .. _amdgpu_synid_sw_offset16:
			
 
				 
			
@@ -95,7 +99,7 @@ See AMD documentation for more information.
 
				 
			
 
				                                                             *mask* is a 5 character sequence which
			
 
				                                                             specifies how to transform the bits of the
			
 
				-                                                            lane *id*. 
			
 
				+                                                            lane *id*.
			
 
				 
			
 
				                                                             The following characters are allowed:
			
 
				 
			
@@ -116,7 +120,7 @@ See AMD documentation for more information.
 
				                                                             size and must be equal to 2, 4, 8, 16 or 32.
			
 
				 
			
 
				                                                             The second numeric parameter is an index of the
			
 
				-                                                            lane being broadcasted. 
			
 
				+                                                            lane being broadcasted.
			
 
				 
			
 
				                                                             The index must not exceed group size.
			
 
				     offset:swizzle(SWAP,{1..16})                            Specifies a swap mode.
			
@@ -128,7 +132,7 @@ See AMD documentation for more information.
 
				                                                             Reverses the lanes for groups of 2, 4, 8, 16 or 32 lanes.
			
 
				     ======================================================= ===========================================================
			
 
				 
			
 
				-Numeric parameters may be specified as either :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+Note: numeric values may be specified as either :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				 :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				 Examples:
			
@@ -137,7 +141,7 @@ Examples:
 
				 
			
 
				   offset:255
			
 
				   offset:0xffff
			
 
				-  offset:swizzle(QUAD_PERM, 0, 1, 2 ,3)
			
 
				+  offset:swizzle(QUAD_PERM, 0, 1, 2, 3)
			
 
				   offset:swizzle(BITMASK_PERM, "01pi0")
			
 
				   offset:swizzle(BROADCAST, 2, 0)
			
 
				   offset:swizzle(SWAP, 8)
			
@@ -212,19 +216,20 @@ Specifies an immediate unsigned 12-bit offset, in bytes. The default value is 0.
 
				 
			
 
				 Cannot be used with *global/scratch* opcodes. GFX9 only.
			
 
				 
			
 
				-    ================= ======================================================
			
 
				+    ================= ====================================================================
			
 
				     Syntax            Description
			
 
				-    ================= ======================================================
			
 
				+    ================= ====================================================================
			
 
				     offset:{0..4095}  Specifies a 12-bit unsigned offset as a positive
			
 
				-                      :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    ================= ======================================================
			
 
				+                      :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                      or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    ================= ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				   offset:4095
			
 
				-  offset:0xff
			
 
				+  offset:x-0xff
			
 
				 
			
 
				 .. _amdgpu_synid_flat_offset13s:
			
 
				 
			
@@ -235,12 +240,13 @@ Specifies an immediate signed 13-bit offset, in bytes. The default value is 0.
 
				 
			
 
				 Can be used with *global/scratch* opcodes only. GFX9 only.
			
 
				 
			
 
				-    ============================ =======================================================
			
 
				-    Syntax                       Description
			
 
				-    ============================ =======================================================
			
 
				-    offset:{-4096..4095}         Specifies a 13-bit signed offset as an
			
 
				-                                 :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    ============================ =======================================================
			
 
				+    ===================== ====================================================================
			
 
				+    Syntax                Description
			
 
				+    ===================== ====================================================================
			
 
				+    offset:{-4096..4095}  Specifies a 13-bit signed offset as an
			
 
				+                          :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                          or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    ===================== ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
@@ -248,6 +254,7 @@ Examples:
 
				 
			
 
				   offset:-4000
			
 
				   offset:0x10
			
 
				+  offset:-x
			
 
				 
			
 
				 .. _amdgpu_synid_flat_offset12s:
			
 
				 
			
@@ -260,12 +267,13 @@ Can be used with *global/scratch* opcodes only.
 
				 
			
 
				 GFX10 only.
			
 
				 
			
 
				-    ============================ =======================================================
			
 
				-    Syntax                       Description
			
 
				-    ============================ =======================================================
			
 
				-    offset:{-2048..2047}         Specifies a 12-bit signed offset as an
			
 
				-                                 :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    ============================ =======================================================
			
 
				+    ===================== ====================================================================
			
 
				+    Syntax                Description
			
 
				+    ===================== ====================================================================
			
 
				+    offset:{-2048..2047}  Specifies a 12-bit signed offset as an
			
 
				+                          :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                          or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    ===================== ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
@@ -273,6 +281,7 @@ Examples:
 
				 
			
 
				   offset:-2000
			
 
				   offset:0x10
			
 
				+  offset:-x+y
			
 
				 
			
 
				 .. _amdgpu_synid_flat_offset11:
			
 
				 
			
@@ -285,19 +294,20 @@ Cannot be used with *global/scratch* opcodes.
 
				 
			
 
				 GFX10 only.
			
 
				 
			
 
				-    ================= ======================================================
			
 
				+    ================= ====================================================================
			
 
				     Syntax            Description
			
 
				-    ================= ======================================================
			
 
				+    ================= ====================================================================
			
 
				     offset:{0..2047}  Specifies an 11-bit unsigned offset as a positive
			
 
				-                      :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    ================= ======================================================
			
 
				+                      :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                      or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    ================= ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				   offset:2047
			
 
				-  offset:0xff
			
 
				+  offset:x+0xff
			
 
				 
			
 
				 dlc
			
 
				 ~~~
			
@@ -340,19 +350,18 @@ dmask
 
				 Specifies which channels (image components) are used by the operation. By default, no channels
			
 
				 are used.
			
 
				 
			
 
				-    =============== =====================================================
			
 
				+    =============== ====================================================================
			
 
				     Syntax          Description
			
 
				-    =============== =====================================================
			
 
				+    =============== ====================================================================
			
 
				     dmask:{0..15}   Specifies image channels as a positive
			
 
				-                    :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				+                    :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                    or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				-                    Each bit corresponds to one of 4 image
			
 
				-                    components (RGBA).
			
 
				+                    Each bit corresponds to one of 4 image components (RGBA).
			
 
				 
			
 
				-                    If the specified bit value
			
 
				-                    is 0, the component is not used, value 1 means
			
 
				-                    that the component is used.
			
 
				-    =============== =====================================================
			
 
				+                    If the specified bit value is 0, the component is not used,
			
 
				+                    value 1 means that the component is used.
			
 
				+    =============== ====================================================================
			
 
				 
			
 
				 This modifier has some limitations depending on instruction kind:
			
 
				 
			
@@ -373,7 +382,7 @@ Examples:
 
				 
			
 
				   dmask:0xf
			
 
				   dmask:0b1111
			
 
				-  dmask:3
			
 
				+  dmask:x|y|z
			
 
				 
			
 
				 .. _amdgpu_synid_unorm:
			
 
				 
			
@@ -468,7 +477,7 @@ Specifies data size: 16 or 32 bits (32 bits by default). Not supported by GFX7.
 
				                                              Each 16-bit data element occupies 1 VGPR.
			
 
				 
			
 
				                                              GFX8.1, GFX9 and GFX10 support data packing.
			
 
				-                                             Each pair of 16-bit data elements 
			
 
				+                                             Each pair of 16-bit data elements
			
 
				                                              occupies 1 VGPR.
			
 
				     ======================================== ================================================
			
 
				 
			
@@ -684,18 +693,19 @@ offset12
 
				 
			
 
				 Specifies an immediate unsigned 12-bit offset, in bytes. The default value is 0.
			
 
				 
			
 
				-    =============================== ======================================================
			
 
				-    Syntax                          Description
			
 
				-    =============================== ======================================================
			
 
				-    offset:{0..0xFFF}               Specifies a 12-bit unsigned offset as a positive
			
 
				-                                    :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				-    =============================== ======================================================
			
 
				+    ================== ====================================================================
			
 
				+    Syntax             Description
			
 
				+    ================== ====================================================================
			
 
				+    offset:{0..0xFFF}  Specifies a 12-bit unsigned offset as a positive
			
 
				+                       :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                       or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+    ================== ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-  offset:0
			
 
				+  offset:x+y
			
 
				   offset:0x10
			
 
				 
			
 
				 glc
			
@@ -782,14 +792,18 @@ GFX10 only.
 
				 dpp8_sel
			
 
				 ~~~~~~~~
			
 
				 
			
 
				-Selects which lane to pull data from, within a group of 8 lanes. This is a mandatory modifier.
			
 
				+Selects which lanes to pull data from, within a group of 8 lanes. This is a mandatory modifier.
			
 
				 There is no default value.
			
 
				 
			
 
				 GFX10 only.
			
 
				 
			
 
				-The *dpp8_sel* modifier must specify exactly 8 values, each ranging from 0 to 7.
			
 
				+The *dpp8_sel* modifier must specify exactly 8 values.
			
 
				 First value selects which lane to read from to supply data into lane 0.
			
 
				-Second value controls value for lane 1 and so on.
			
 
				+Second value controls lane 1 and so on.
			
 
				+
			
 
				+Each value may be specified as either
			
 
				+an :ref:`integer number<amdgpu_synid_integer_number>` or
			
 
				+an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				     =============================================================== ===========================
			
 
				     Syntax                                                          Description
			
@@ -811,7 +825,7 @@ fi
 
				 
			
 
				 Controls interaction with inactive lanes for *dpp8* instructions. The default value is zero.
			
 
				 
			
 
				-Note. *Inactive* lanes are those whose :ref:`exec<amdgpu_synid_exec>` mask bit is zero.
			
 
				+Note: *inactive* lanes are those whose :ref:`exec<amdgpu_synid_exec>` mask bit is zero.
			
 
				 
			
 
				 GFX10 only.
			
 
				 
			
@@ -822,6 +836,9 @@ GFX10 only.
 
				     fi:1                                 Fetch pre-exist values from inactive lanes.
			
 
				     ==================================== =====================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 DPP/DPP16 Modifiers
			
 
				 -------------------
			
 
				 
			
@@ -837,7 +854,7 @@ There is no default value.
 
				 
			
 
				 GFX8 and GFX9 only. Use :ref:`dpp16_ctrl<amdgpu_synid_dpp16_ctrl>` for GFX10.
			
 
				 
			
 
				-Note. The lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				+Note: the lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				 
			
 
				     ======================================== ================================================
			
 
				     Syntax                                   Description
			
@@ -856,7 +873,7 @@ Note. The lanes of a wavefront are organized in four *rows* and four *banks*.
 
				     row_ror:{1..15}                          Row rotate right by 1-15 threads.
			
 
				     ======================================== ================================================
			
 
				 
			
 
				-Note: Numeric parameters may be specified as either
			
 
				+Note: numeric values may be specified as either
			
 
				 :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				 :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
@@ -877,7 +894,7 @@ There is no default value.
 
				 
			
 
				 GFX10 only. Use :ref:`dpp_ctrl<amdgpu_synid_dpp_ctrl>` for GFX8 and GFX9.
			
 
				 
			
 
				-Note. The lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				+Note: the lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				 (There are only two rows in *wave32* mode.)
			
 
				 
			
 
				     ======================================== ====================================================
			
@@ -894,7 +911,7 @@ Note. The lanes of a wavefront are organized in four *rows* and four *banks*.
 
				     row_ror:{1..15}                          Row rotate right by 1-15 threads.
			
 
				     ======================================== ====================================================
			
 
				 
			
 
				-Note: Numeric parameters may be specified as either
			
 
				+Note: numeric values may be specified as either
			
 
				 :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				 :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				 
			
@@ -912,21 +929,21 @@ row_mask
 
				 
			
 
				 Controls which rows are enabled for data sharing. By default, all rows are enabled.
			
 
				 
			
 
				-Note. The lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				+Note: the lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				 (There are only two rows in *wave32* mode.)
			
 
				 
			
 
				-    ======================================== =====================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== =====================================================
			
 
				-    row_mask:{0..15}                         Specifies a *row mask* as a positive
			
 
				-                                             :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				+    ================= ====================================================================
			
 
				+    Syntax            Description
			
 
				+    ================= ====================================================================
			
 
				+    row_mask:{0..15}  Specifies a *row mask* as a positive
			
 
				+                      :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                      or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				-                                             Each of 4 bits in the mask controls one
			
 
				-                                             row (0 - disabled, 1 - enabled).
			
 
				+                      Each of 4 bits in the mask controls one row
			
 
				+                      (0 - disabled, 1 - enabled).
			
 
				 
			
 
				-                                             In *wave32* mode the values should be limited to
			
 
				-                                             {0..7}.
			
 
				-    ======================================== =====================================================
			
 
				+                      In *wave32* mode the values should be limited to 0..7.
			
 
				+    ================= ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
@@ -934,7 +951,7 @@ Examples:
 
				 
			
 
				   row_mask:0xf
			
 
				   row_mask:0b1010
			
 
				-  row_mask:0b1111
			
 
				+  row_mask:x|y
			
 
				 
			
 
				 .. _amdgpu_synid_bank_mask:
			
 
				 
			
@@ -943,18 +960,19 @@ bank_mask
 
				 
			
 
				 Controls which banks are enabled for data sharing. By default, all banks are enabled.
			
 
				 
			
 
				-Note. The lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				+Note: the lanes of a wavefront are organized in four *rows* and four *banks*.
			
 
				 (There are only two rows in *wave32* mode.)
			
 
				 
			
 
				-    ======================================== =======================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== =======================================================
			
 
				-    bank_mask:{0..15}                        Specifies a *bank mask* as a positive
			
 
				-                                             :ref:`integer number <amdgpu_synid_integer_number>`.
			
 
				+    ================== ====================================================================
			
 
				+    Syntax             Description
			
 
				+    ================== ====================================================================
			
 
				+    bank_mask:{0..15}  Specifies a *bank mask* as a positive
			
 
				+                       :ref:`integer number <amdgpu_synid_integer_number>`
			
 
				+                       or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				 
			
 
				-                                             Each of 4 bits in the mask controls one
			
 
				-                                             bank (0 - disabled, 1 - enabled).
			
 
				-    ======================================== =======================================================
			
 
				+                       Each of 4 bits in the mask controls one bank
			
 
				+                       (0 - disabled, 1 - enabled).
			
 
				+    ================== ====================================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
@@ -962,7 +980,7 @@ Examples:
 
				 
			
 
				   bank_mask:0x3
			
 
				   bank_mask:0b0011
			
 
				-  bank_mask:0b1111
			
 
				+  bank_mask:x&y
			
 
				 
			
 
				 .. _amdgpu_synid_bound_ctrl:
			
 
				 
			
@@ -988,7 +1006,7 @@ fi
 
				 
			
 
				 Controls interaction with *inactive* lanes for *dpp16* instructions. The default value is zero.
			
 
				 
			
 
				-Note. *Inactive* lanes are those whose :ref:`exec<amdgpu_synid_exec>` mask bit is zero.
			
 
				+Note: *inactive* lanes are those whose :ref:`exec<amdgpu_synid_exec>` mask bit is zero.
			
 
				 
			
 
				 GFX10 only.
			
 
				 
			
@@ -1001,6 +1019,9 @@ GFX10 only.
 
				     fi:1                                     Fetch pre-exist values from inactive lanes.
			
 
				     ======================================== ==================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 SDWA Modifiers
			
 
				 --------------
			
 
				 
			
@@ -1037,7 +1058,6 @@ Selects which bits in the destination are affected. By default, all bits are aff
 
				     dst_sel:WORD_1                           Use bits 31:16.
			
 
				     ======================================== ================================================
			
 
				 
			
 
				-
			
 
				 .. _amdgpu_synid_dst_unused:
			
 
				 
			
 
				 dst_unused
			
@@ -1151,7 +1171,7 @@ operands (both source and destination). First value controls src0, second value
 
				 and so on, except that the last value controls destination.
			
 
				 The value 0 selects the low bits, while 1 selects the high bits.
			
 
				 
			
 
				-Note. op_sel modifier affects 16-bit operands only. For 32-bit operands the value specified
			
 
				+Note: op_sel modifier affects 16-bit operands only. For 32-bit operands the value specified
			
 
				 by op_sel must be 0.
			
 
				 
			
 
				 GFX9 and GFX10 only.
			
@@ -1164,6 +1184,10 @@ GFX9 and GFX10 only.
 
				     op_sel:[{0..1},{0..1},{0..1},{0..1}]     Select operand bits for instructions with 3 source operands.
			
 
				     ======================================== ============================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -1189,7 +1213,7 @@ Integer clamping is not supported by GFX7.
 
				 For floating point operations, clamp modifier indicates that the result must be clamped
			
 
				 to the range [0.0, 1.0]. By default, there is no clamping.
			
 
				 
			
 
				-Note. Clamp modifier is applied after :ref:`output modifiers<amdgpu_synid_omod>` (if any).
			
 
				+Note: clamp modifier is applied after :ref:`output modifiers<amdgpu_synid_omod>` (if any).
			
 
				 
			
 
				     ======================================== ================================================
			
 
				     Syntax                                   Description
			
@@ -1205,12 +1229,12 @@ omod
 
				 Specifies if an output modifier must be applied to the result.
			
 
				 By default, no output modifiers are applied.
			
 
				 
			
 
				-Note. Output modifiers are applied before :ref:`clamping<amdgpu_synid_clamp>` (if any).
			
 
				+Note: output modifiers are applied before :ref:`clamping<amdgpu_synid_clamp>` (if any).
			
 
				 
			
 
				 Output modifiers are valid for f32 and f64 floating point results only.
			
 
				 They must not be used with f16.
			
 
				 
			
 
				-Note. *v_cvt_f16_f32* is an exception. This instruction produces f16 result
			
 
				+Note: *v_cvt_f16_f32* is an exception. This instruction produces f16 result
			
 
				 but accepts output modifiers.
			
 
				 
			
 
				     ======================================== ================================================
			
@@ -1221,6 +1245,16 @@ but accepts output modifiers.
 
				     div:2                                    Multiply the result by 0.5.
			
 
				     ======================================== ================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				+Examples:
			
 
				+
			
 
				+.. parsed-literal::
			
 
				+
			
 
				+  mul:2
			
 
				+  mul:x      // x must be equal to 2 or 4
			
 
				+
			
 
				 .. _amdgpu_synid_vop3_operand_modifiers:
			
 
				 
			
 
				 VOP3 Operand Modifiers
			
@@ -1233,15 +1267,19 @@ Operand modifiers are not used separately. They are applied to source operands.
 
				 abs
			
 
				 ~~~
			
 
				 
			
 
				-Computes absolute value of its operand. Applied before :ref:`neg<amdgpu_synid_neg>` (if any).
			
 
				-Valid for floating point operands only.
			
 
				+Computes the absolute value of its operand. Must be applied before :ref:`neg<amdgpu_synid_neg>`
			
 
				+(if any). Valid for floating point operands only.
			
 
				 
			
 
				-    ======================================== ================================================
			
 
				+    ======================================== ====================================================
			
 
				     Syntax                                   Description
			
 
				-    ======================================== ================================================
			
 
				-    abs(<operand>)                           Get absolute value of operand.
			
 
				-    \|<operand>|                             The same as above.
			
 
				-    ======================================== ================================================
			
 
				+    ======================================== ====================================================
			
 
				+    abs(<operand>)                           Get the absolute value of a floating-point operand.
			
 
				+    \|<operand>|                             The same as above (an SP3 syntax).
			
 
				+    ======================================== ====================================================
			
 
				+
			
 
				+Note: avoid using SP3 syntax with operands specified as expressions because the trailing '|'
			
 
				+may be misinterpreted. Such operands should be enclosed into additional parentheses as shown
			
 
				+in examples below.
			
 
				 
			
 
				 Examples:
			
 
				 
			
@@ -1249,28 +1287,50 @@ Examples:
 
				 
			
 
				   abs(v36)
			
 
				   \|v36|
			
 
				+  abs(x|y)     // ok
			
 
				+  \|(x|y)|      // additional parentheses are required
			
 
				 
			
 
				 .. _amdgpu_synid_neg:
			
 
				 
			
 
				 neg
			
 
				 ~~~
			
 
				 
			
 
				-Computes negative value of its operand. Applied after :ref:`abs<amdgpu_synid_abs>` (if any).
			
 
				-Valid for floating point operands only.
			
 
				+Computes the negative value of its operand. Must be applied after :ref:`abs<amdgpu_synid_abs>`
			
 
				+(if any). Valid for floating point operands only.
			
 
				 
			
 
				-    ======================================== ================================================
			
 
				-    Syntax                                   Description
			
 
				-    ======================================== ================================================
			
 
				-    neg(<operand>)                           Get negative value of operand.
			
 
				-    -<operand>                               The same as above.
			
 
				-    ======================================== ================================================
			
 
				+    ================== ====================================================
			
 
				+    Syntax             Description
			
 
				+    ================== ====================================================
			
 
				+    neg(<operand>)     Get the negative value of a floating-point operand.
			
 
				+                       The operand may include an optional
			
 
				+                       :ref:`abs<amdgpu_synid_abs>` modifier.
			
 
				+    -<operand>         The same as above (an SP3 syntax).
			
 
				+    ================== ====================================================
			
 
				+
			
 
				+Note: SP3 syntax is supported with limitations because of a potential ambiguity.
			
 
				+Currently it is allowed in the following cases:
			
 
				+
			
 
				+* Before a register.
			
 
				+* Before an :ref:`abs<amdgpu_synid_abs>` modifier.
			
 
				+* Before an SP3 :ref:`abs<amdgpu_synid_abs>` modifier.
			
 
				+
			
 
				+In all other cases "-" is handled as a part of an expression that follows the sign.
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				+  // Operands with negate modifiers
			
 
				   neg(v[0])
			
 
				-  -v4
			
 
				+  neg(1.0)
			
 
				+  neg(abs(v0))
			
 
				+  -v5
			
 
				+  -abs(v5)
			
 
				+  -\|v5|
			
 
				+
			
 
				+  // Operands without negate modifiers
			
 
				+  -1
			
 
				+  -x+y
			
 
				 
			
 
				 VOP3P Modifiers
			
 
				 ---------------
			
@@ -1304,6 +1364,10 @@ The value 0 selects the low bits, while 1 selects the high bits.
 
				     op_sel:[{0..1},{0..1},{0..1}]     Select operand bits for instructions with 3 source operands.
			
 
				     ================================= =============================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -1333,6 +1397,10 @@ The value 0 selects the low bits, while 1 selects the high bits.
 
				     op_sel_hi:[{0..1},{0..1},{0..1}]    Select operand bits for instructions with 3 source operands.
			
 
				     =================================== =============================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -1367,6 +1435,10 @@ This modifier is valid for floating point operands only.
 
				     neg_lo:[{0..1},{0..1},{0..1}]    Select affected operands for instructions with 3 source operands.
			
 
				     ================================ ==================================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -1401,6 +1473,10 @@ This modifier is valid for floating point operands only.
 
				     neg_hi:[{0..1},{0..1},{0..1}]   Select affected operands for instructions with 3 source operands.
			
 
				     =============================== ==================================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -1419,7 +1495,7 @@ VOP3P V_MAD_MIX Modifiers
 
				 -------------------------
			
 
				 
			
 
				 *v_mad_mix_f32*, *v_mad_mixhi_f16* and *v_mad_mixlo_f16* instructions
			
 
				-use *op_sel* and *op_sel_hi* modifiers 
			
 
				+use *op_sel* and *op_sel_hi* modifiers
			
 
				 in a manner different from *regular* VOP3P instructions.
			
 
				 
			
 
				 See a description below.
			
@@ -1449,6 +1525,10 @@ By default, low bits are used for all operands.
 
				     op_sel:[{0..1},{0..1},{0..1}]   Select location of each 16-bit source operand.
			
 
				     =============================== ================================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -1477,6 +1557,10 @@ The location of 16 bits in the operand may be specified by
 
				     op_sel_hi:[{0..1},{0..1},{0..1}]         Select size of each source operand.
			
 
				     ======================================== ====================================
			
 
				 
			
 
				+Note: numeric values may be specified as either
			
 
				+:ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
--- a/docs/AMDGPUOperandSyntax.rst
+++ b/docs/AMDGPUOperandSyntax.rst
@@ -38,7 +38,8 @@ Assembler currently supports sequences of 1, 2, 3, 4, 8 and 16 *vector* register
 
				     =================================================== ====================================================================
			
 
				     **v**\<N>                                           A single 32-bit *vector* register.
			
 
				 
			
 
				-                                                        *N* must be a decimal integer number.
			
 
				+                                                        *N* must be a decimal
			
 
				+                                                        :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				     **v[**\ <N>\ **]**                                  A single 32-bit *vector* register.
			
 
				 
			
 
				                                                         *N* may be specified as an
			
@@ -51,10 +52,11 @@ Assembler currently supports sequences of 1, 2, 3, 4, 8 and 16 *vector* register
 
				                                                         or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				     **[v**\ <N>, \ **v**\ <N+1>, ... **v**\ <K>\ **]**  A sequence of (\ *K-N+1*\ ) *vector* registers.
			
 
				 
			
 
				-                                                        Register indices must be specified as decimal integer numbers.
			
 
				+                                                        Register indices must be specified as decimal
			
 
				+                                                        :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				     =================================================== ====================================================================
			
 
				 
			
 
				-Note. *N* and *K* must satisfy the following conditions:
			
 
				+Note: *N* and *K* must satisfy the following conditions:
			
 
				 
			
 
				 * *N* <= *K*.
			
 
				 * 0 <= *N* <= 255.
			
@@ -77,26 +79,27 @@ Examples:
 
				 
			
 
				 .. _amdgpu_synid_nsa:
			
 
				 
			
 
				-*Image* instructions may use special *NSA* (Non-Sequential Address) syntax for *image addresses*:
			
 
				+GFX10 *Image* instructions may use special *NSA* (Non-Sequential Address) syntax for *image addresses*:
			
 
				 
			
 
				-    =================================================== ====================================================================
			
 
				-    Syntax                                              Description
			
 
				-    =================================================== ====================================================================
			
 
				-    **[v**\ <A>, \ **v**\ <B>, ... **v**\ <X>\ **]**    A sequence of *vector* registers. At least one register
			
 
				-                                                        must be specified.
			
 
				+    ===================================== =================================================
			
 
				+    Syntax                                Description
			
 
				+    ===================================== =================================================
			
 
				+    **[Vm**, \ **Vn**, ... **Vk**\ **]**  A sequence of 32-bit *vector* registers.
			
 
				+                                          Each register may be specified using a syntax
			
 
				+                                          defined :ref:`above<amdgpu_synid_v>`.
			
 
				 
			
 
				-                                                        In contrast with standard syntax described above, registers in
			
 
				-                                                        this sequence are not required to have consecutive indices.
			
 
				-                                                        Moreover, the same register may appear in the list more than once.
			
 
				-    =================================================== ====================================================================
			
 
				-
			
 
				-Note. Reqister indices must be in the range 0..255. They must be specified as decimal integer numbers.
			
 
				+                                          In contrast with standard syntax, registers
			
 
				+                                          in *NSA* sequence are not required to have
			
 
				+                                          consecutive indices. Moreover, the same register
			
 
				+                                          may appear in the list more than once.
			
 
				+    ===================================== =================================================
			
 
				 
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-  [v32,v1,v2]
			
 
				+  [v32,v1,v[2]]
			
 
				+  [v[32],v[1:1],[v2]]
			
 
				   [v4,v4,v4,v4]
			
 
				 
			
 
				 .. _amdgpu_synid_s:
			
@@ -126,7 +129,9 @@ Sequences of 4 and more *scalar* registers must be quad-aligned.
 
				     ======================================================== ====================================================================
			
 
				     **s**\ <N>                                               A single 32-bit *scalar* register.
			
 
				 
			
 
				-                                                             *N* must be a decimal integer number.
			
 
				+                                                             *N* must be a decimal
			
 
				+                                                             :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				+
			
 
				     **s[**\ <N>\ **]**                                       A single 32-bit *scalar* register.
			
 
				 
			
 
				                                                              *N* may be specified as an
			
@@ -137,12 +142,14 @@ Sequences of 4 and more *scalar* registers must be quad-aligned.
 
				                                                              *N* and *K* may be specified as
			
 
				                                                              :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				                                                              or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				     **[s**\ <N>, \ **s**\ <N+1>, ... **s**\ <K>\ **]**       A sequence of (\ *K-N+1*\ ) *scalar* registers.
			
 
				 
			
 
				-                                                             Register indices must be specified as decimal integer numbers.
			
 
				+                                                             Register indices must be specified as decimal
			
 
				+                                                             :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				     ======================================================== ====================================================================
			
 
				 
			
 
				-Note. *N* and *K* must satisfy the following conditions:
			
 
				+Note: *N* and *K* must satisfy the following conditions:
			
 
				 
			
 
				 * *N* must be properly aligned based on sequence size.
			
 
				 * *N* <= *K*.
			
@@ -210,7 +217,8 @@ Sequences of 4 and more *ttmp* registers must be quad-aligned.
 
				     ============================================================= ====================================================================
			
 
				     **ttmp**\ <N>                                                 A single 32-bit *ttmp* register.
			
 
				 
			
 
				-                                                                  *N* must be a decimal integer number.
			
 
				+                                                                  *N* must be a decimal
			
 
				+                                                                  :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				     **ttmp[**\ <N>\ **]**                                         A single 32-bit *ttmp* register.
			
 
				 
			
 
				                                                                   *N* may be specified as an
			
@@ -223,10 +231,11 @@ Sequences of 4 and more *ttmp* registers must be quad-aligned.
 
				                                                                   or :ref:`absolute expressions<amdgpu_synid_absolute_expression>`.
			
 
				     **[ttmp**\ <N>, \ **ttmp**\ <N+1>, ... **ttmp**\ <K>\ **]**   A sequence of (\ *K-N+1*\ ) *ttmp* registers.
			
 
				 
			
 
				-                                                                  Register indices must be specified as decimal integer numbers.
			
 
				+                                                                  Register indices must be specified as decimal
			
 
				+                                                                  :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				     ============================================================= ====================================================================
			
 
				 
			
 
				-Note. *N* and *K* must satisfy the following conditions:
			
 
				+Note: *N* and *K* must satisfy the following conditions:
			
 
				 
			
 
				 * *N* must be properly aligned based on sequence size.
			
 
				 * *N* <= *K*.
			
@@ -266,8 +275,8 @@ Trap base address, 64-bits wide. Holds the pointer to the current trap handler p
 
				     Syntax             Description                                                             Availability
			
 
				     ================== ======================================================================= =============
			
 
				     tba                64-bit *trap base address* register.                                    GFX7, GFX8
			
 
				-    [tba]              64-bit *trap base address* register (an alternative syntax).            GFX7, GFX8
			
 
				-    [tba_lo,tba_hi]    64-bit *trap base address* register (an alternative syntax).            GFX7, GFX8
			
 
				+    [tba]              64-bit *trap base address* register (an SP3 syntax).                    GFX7, GFX8
			
 
				+    [tba_lo,tba_hi]    64-bit *trap base address* register (an SP3 syntax).                    GFX7, GFX8
			
 
				     ================== ======================================================================= =============
			
 
				 
			
 
				 High and low 32 bits of *trap base address* may be accessed as separate registers:
			
@@ -277,8 +286,8 @@ High and low 32 bits of *trap base address* may be accessed as separate register
 
				     ================== ======================================================================= =============
			
 
				     tba_lo             Low 32 bits of *trap base address* register.                            GFX7, GFX8
			
 
				     tba_hi             High 32 bits of *trap base address* register.                           GFX7, GFX8
			
 
				-    [tba_lo]           Low 32 bits of *trap base address* register (an alternative syntax).    GFX7, GFX8
			
 
				-    [tba_hi]           High 32 bits of *trap base address* register (an alternative syntax).   GFX7, GFX8
			
 
				+    [tba_lo]           Low 32 bits of *trap base address* register (an SP3 syntax).            GFX7, GFX8
			
 
				+    [tba_hi]           High 32 bits of *trap base address* register (an SP3 syntax).           GFX7, GFX8
			
 
				     ================== ======================================================================= =============
			
 
				 
			
 
				 Note that *tba*, *tba_lo* and *tba_hi* are not accessible as assembler registers in GFX9 and GFX10,
			
@@ -295,8 +304,8 @@ Trap memory address, 64-bits wide.
 
				     Syntax            Description                                                             Availability
			
 
				     ================= ======================================================================= ==================
			
 
				     tma               64-bit *trap memory address* register.                                  GFX7, GFX8
			
 
				-    [tma]             64-bit *trap memory address* register (an alternative syntax).          GFX7, GFX8
			
 
				-    [tma_lo,tma_hi]   64-bit *trap memory address* register (an alternative syntax).          GFX7, GFX8
			
 
				+    [tma]             64-bit *trap memory address* register (an SP3 syntax).                  GFX7, GFX8
			
 
				+    [tma_lo,tma_hi]   64-bit *trap memory address* register (an SP3 syntax).                  GFX7, GFX8
			
 
				     ================= ======================================================================= ==================
			
 
				 
			
 
				 High and low 32 bits of *trap memory address* may be accessed as separate registers:
			
@@ -306,8 +315,8 @@ High and low 32 bits of *trap memory address* may be accessed as separate regist
 
				     ================= ======================================================================= ==================
			
 
				     tma_lo            Low 32 bits of *trap memory address* register.                          GFX7, GFX8
			
 
				     tma_hi            High 32 bits of *trap memory address* register.                         GFX7, GFX8
			
 
				-    [tma_lo]          Low 32 bits of *trap memory address* register (an alternative syntax).  GFX7, GFX8
			
 
				-    [tma_hi]          High 32 bits of *trap memory address* register (an alternative syntax). GFX7, GFX8
			
 
				+    [tma_lo]          Low 32 bits of *trap memory address* register (an SP3 syntax).          GFX7, GFX8
			
 
				+    [tma_hi]          High 32 bits of *trap memory address* register (an SP3 syntax).         GFX7, GFX8
			
 
				     ================= ======================================================================= ==================
			
 
				 
			
 
				 Note that *tma*, *tma_lo* and *tma_hi* are not accessible as assembler registers in GFX9 and GFX10,
			
@@ -324,8 +333,8 @@ Flat scratch address, 64-bits wide. Holds the base address of scratch memory.
 
				     Syntax                             Description
			
 
				     ================================== ================================================================
			
 
				     flat_scratch                       64-bit *flat scratch* address register.
			
 
				-    [flat_scratch]                     64-bit *flat scratch* address register (an alternative syntax).
			
 
				-    [flat_scratch_lo,flat_scratch_hi]  64-bit *flat scratch* address register (an alternative syntax).
			
 
				+    [flat_scratch]                     64-bit *flat scratch* address register (an SP3 syntax).
			
 
				+    [flat_scratch_lo,flat_scratch_hi]  64-bit *flat scratch* address register (an SP3 syntax).
			
 
				     ================================== ================================================================
			
 
				 
			
 
				 High and low 32 bits of *flat scratch* address may be accessed as separate registers:
			
@@ -335,8 +344,8 @@ High and low 32 bits of *flat scratch* address may be accessed as separate regis
 
				     ========================= =========================================================================
			
 
				     flat_scratch_lo           Low 32 bits of *flat scratch* address register.
			
 
				     flat_scratch_hi           High 32 bits of *flat scratch* address register.
			
 
				-    [flat_scratch_lo]         Low 32 bits of *flat scratch* address register (an alternative syntax).
			
 
				-    [flat_scratch_hi]         High 32 bits of *flat scratch* address register (an alternative syntax).
			
 
				+    [flat_scratch_lo]         Low 32 bits of *flat scratch* address register (an SP3 syntax).
			
 
				+    [flat_scratch_hi]         High 32 bits of *flat scratch* address register (an SP3 syntax).
			
 
				     ========================= =========================================================================
			
 
				 
			
 
				 .. _amdgpu_synid_xnack:
			
@@ -355,8 +364,8 @@ received an *XNACK* due to a vector memory operation.
 
				     Syntax                         Description
			
 
				     ============================== =====================================================
			
 
				     xnack_mask                     64-bit *xnack mask* register.
			
 
				-    [xnack_mask]                   64-bit *xnack mask* register (an alternative syntax).
			
 
				-    [xnack_mask_lo,xnack_mask_hi]  64-bit *xnack mask* register (an alternative syntax).
			
 
				+    [xnack_mask]                   64-bit *xnack mask* register (an SP3 syntax).
			
 
				+    [xnack_mask_lo,xnack_mask_hi]  64-bit *xnack mask* register (an SP3 syntax).
			
 
				     ============================== =====================================================
			
 
				 
			
 
				 High and low 32 bits of *xnack mask* may be accessed as separate registers:
			
@@ -366,8 +375,8 @@ High and low 32 bits of *xnack mask* may be accessed as separate registers:
 
				     ===================== ==============================================================
			
 
				     xnack_mask_lo         Low 32 bits of *xnack mask* register.
			
 
				     xnack_mask_hi         High 32 bits of *xnack mask* register.
			
 
				-    [xnack_mask_lo]       Low 32 bits of *xnack mask* register (an alternative syntax).
			
 
				-    [xnack_mask_hi]       High 32 bits of *xnack mask* register (an alternative syntax).
			
 
				+    [xnack_mask_lo]       Low 32 bits of *xnack mask* register (an SP3 syntax).
			
 
				+    [xnack_mask_hi]       High 32 bits of *xnack mask* register (an SP3 syntax).
			
 
				     ===================== ==============================================================
			
 
				 
			
 
				 .. _amdgpu_synid_vcc:
			
@@ -385,8 +394,8 @@ Note that GFX10 H/W does not use high 32 bits of *vcc* in *wave32* mode.
 
				     Syntax           Description
			
 
				     ================ =========================================================================
			
 
				     vcc              64-bit *vector condition code* register.
			
 
				-    [vcc]            64-bit *vector condition code* register (an alternative syntax).
			
 
				-    [vcc_lo,vcc_hi]  64-bit *vector condition code* register (an alternative syntax).
			
 
				+    [vcc]            64-bit *vector condition code* register (an SP3 syntax).
			
 
				+    [vcc_lo,vcc_hi]  64-bit *vector condition code* register (an SP3 syntax).
			
 
				     ================ =========================================================================
			
 
				 
			
 
				 High and low 32 bits of *vector condition code* may be accessed as separate registers:
			
@@ -396,8 +405,8 @@ High and low 32 bits of *vector condition code* may be accessed as separate regi
 
				     ================ =========================================================================
			
 
				     vcc_lo           Low 32 bits of *vector condition code* register.
			
 
				     vcc_hi           High 32 bits of *vector condition code* register.
			
 
				-    [vcc_lo]         Low 32 bits of *vector condition code* register (an alternative syntax).
			
 
				-    [vcc_hi]         High 32 bits of *vector condition code* register (an alternative syntax).
			
 
				+    [vcc_lo]         Low 32 bits of *vector condition code* register (an SP3 syntax).
			
 
				+    [vcc_hi]         High 32 bits of *vector condition code* register (an SP3 syntax).
			
 
				     ================ =========================================================================
			
 
				 
			
 
				 .. _amdgpu_synid_m0:
			
@@ -412,7 +421,7 @@ including register indexing and bounds checking.
 
				     Syntax      Description
			
 
				     =========== ===================================================
			
 
				     m0          A 32-bit *memory* register.
			
 
				-    [m0]        A 32-bit *memory* register (an alternative syntax).
			
 
				+    [m0]        A 32-bit *memory* register (an SP3 syntax).
			
 
				     =========== ===================================================
			
 
				 
			
 
				 .. _amdgpu_synid_exec:
			
@@ -430,8 +439,8 @@ Note that GFX10 H/W does not use high 32 bits of *exec* in *wave32* mode.
 
				     Syntax                Description
			
 
				     ===================== =================================================================
			
 
				     exec                  64-bit *execute mask* register.
			
 
				-    [exec]                64-bit *execute mask* register (an alternative syntax).
			
 
				-    [exec_lo,exec_hi]     64-bit *execute mask* register (an alternative syntax).
			
 
				+    [exec]                64-bit *execute mask* register (an SP3 syntax).
			
 
				+    [exec_lo,exec_hi]     64-bit *execute mask* register (an SP3 syntax).
			
 
				     ===================== =================================================================
			
 
				 
			
 
				 High and low 32 bits of *execute mask* may be accessed as separate registers:
			
@@ -441,8 +450,8 @@ High and low 32 bits of *execute mask* may be accessed as separate registers:
 
				     ===================== =================================================================
			
 
				     exec_lo               Low 32 bits of *execute mask* register.
			
 
				     exec_hi               High 32 bits of *execute mask* register.
			
 
				-    [exec_lo]             Low 32 bits of *execute mask* register (an alternative syntax).
			
 
				-    [exec_hi]             High 32 bits of *execute mask* register (an alternative syntax).
			
 
				+    [exec_lo]             Low 32 bits of *execute mask* register (an SP3 syntax).
			
 
				+    [exec_hi]             High 32 bits of *execute mask* register (an SP3 syntax).
			
 
				     ===================== =================================================================
			
 
				 
			
 
				 .. _amdgpu_synid_vccz:
			
@@ -452,7 +461,7 @@ vccz
 
				 
			
 
				 A single bit flag indicating that the :ref:`vcc<amdgpu_synid_vcc>` is all zeros.
			
 
				 
			
 
				-Note. When GFX10 operates in *wave32* mode, this register reflects state of :ref:`vcc_lo<amdgpu_synid_vcc_lo>`.
			
 
				+Note: when GFX10 operates in *wave32* mode, this register reflects state of :ref:`vcc_lo<amdgpu_synid_vcc_lo>`.
			
 
				 
			
 
				 .. _amdgpu_synid_execz:
			
 
				 
			
@@ -461,7 +470,7 @@ execz
 
				 
			
 
				 A single bit flag indicating that the :ref:`exec<amdgpu_synid_exec>` is all zeros.
			
 
				 
			
 
				-Note. When GFX10 operates in *wave32* mode, this register reflects state of :ref:`exec_lo<amdgpu_synid_exec>`.
			
 
				+Note: when GFX10 operates in *wave32* mode, this register reflects state of :ref:`exec_lo<amdgpu_synid_exec>`.
			
 
				 
			
 
				 .. _amdgpu_synid_scc:
			
 
				 
			
@@ -495,19 +504,20 @@ GFX10 only.
 
				 
			
 
				 .. _amdgpu_synid_constant:
			
 
				 
			
 
				-constant
			
 
				---------
			
 
				+inline constant
			
 
				+---------------
			
 
				+
			
 
				+An *inline constant* is an integer or a floating-point value encoded as a part of an instruction.
			
 
				+Compare *inline constants* with :ref:`literals<amdgpu_synid_literal>`.
			
 
				 
			
 
				-A set of integer and floating-point *inline* constants and values:
			
 
				+Inline constants include:
			
 
				 
			
 
				 * :ref:`iconst<amdgpu_synid_iconst>`
			
 
				 * :ref:`fconst<amdgpu_synid_fconst>`
			
 
				 * :ref:`ival<amdgpu_synid_ival>`
			
 
				 
			
 
				-In contrast with :ref:`literals<amdgpu_synid_literal>`, these operands are encoded as a part of instruction.
			
 
				-
			
 
				 If a number may be encoded as either
			
 
				-a :ref:`literal<amdgpu_synid_literal>` or 
			
 
				+a :ref:`literal<amdgpu_synid_literal>` or
			
 
				 a :ref:`constant<amdgpu_synid_constant>`,
			
 
				 assembler selects the latter encoding as more efficient.
			
 
				 
			
@@ -516,17 +526,14 @@ assembler selects the latter encoding as more efficient.
 
				 iconst
			
 
				 ~~~~~~
			
 
				 
			
 
				-An :ref:`integer number<amdgpu_synid_integer_number>`
			
 
				+An :ref:`integer number<amdgpu_synid_integer_number>` or
			
 
				+an :ref:`absolute expression<amdgpu_synid_absolute_expression>`
			
 
				 encoded as an *inline constant*.
			
 
				 
			
 
				 Only a small fraction of integer numbers may be encoded as *inline constants*.
			
 
				 They are enumerated in the table below.
			
 
				 Other integer numbers have to be encoded as :ref:`literals<amdgpu_synid_literal>`.
			
 
				 
			
 
				-Integer *inline constants* are converted to
			
 
				-:ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				-as described :ref:`here<amdgpu_synid_int_const_conv>`.
			
 
				-
			
 
				     ================================== ====================================
			
 
				     Value                              Note
			
 
				     ================================== ====================================
			
@@ -548,10 +555,6 @@ Only a small fraction of floating-point numbers may be encoded as *inline consta
 
				 They are enumerated in the table below.
			
 
				 Other floating-point numbers have to be encoded as :ref:`literals<amdgpu_synid_literal>`.
			
 
				 
			
 
				-Floating-point *inline constants* are converted to
			
 
				-:ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				-as described :ref:`here<amdgpu_synid_fp_const_conv>`.
			
 
				-
			
 
				     ===================== ===================================================== ==================
			
 
				     Value                 Note                                                  Availability
			
 
				     ===================== ===================================================== ==================
			
@@ -594,21 +597,18 @@ These operands provide read-only access to H/W registers.
 
				 literal
			
 
				 -------
			
 
				 
			
 
				-A literal is a 64-bit value which is encoded as a separate 32-bit dword in the instruction stream.
			
 
				+A *literal* is a 64-bit value encoded as a separate 32-bit dword in the instruction stream.
			
 
				+Compare *literals* with :ref:`inline constants<amdgpu_synid_constant>`.
			
 
				 
			
 
				 If a number may be encoded as either
			
 
				-a :ref:`literal<amdgpu_synid_literal>` or 
			
 
				+a :ref:`literal<amdgpu_synid_literal>` or
			
 
				 an :ref:`inline constant<amdgpu_synid_constant>`,
			
 
				 assembler selects the latter encoding as more efficient.
			
 
				 
			
 
				 Literals may be specified as :ref:`integer numbers<amdgpu_synid_integer_number>`,
			
 
				-:ref:`floating-point numbers<amdgpu_synid_floating-point_number>` or
			
 
				-:ref:`expressions<amdgpu_synid_expression>`
			
 
				-(expressions are currently supported for 32-bit operands only).
			
 
				-
			
 
				-A 64-bit literal value is converted by assembler
			
 
				-to an :ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				-as described :ref:`here<amdgpu_synid_lit_conv>`.
			
 
				+:ref:`floating-point numbers<amdgpu_synid_floating-point_number>`,
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>` or
			
 
				+:ref:`relocatable expressions<amdgpu_synid_relocatable_expression>`.
			
 
				 
			
 
				 An instruction may use only one literal but several operands may refer the same literal.
			
 
				 
			
@@ -617,30 +617,38 @@ An instruction may use only one literal but several operands may refer the same
 
				 uimm8
			
 
				 -----
			
 
				 
			
 
				-A 8-bit positive :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				-The value is encoded as part of the opcode so it is free to use.
			
 
				+A 8-bit :ref:`integer number<amdgpu_synid_integer_number>`
			
 
				+or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value must be in the range 0..0xFF.
			
 
				 
			
 
				 .. _amdgpu_synid_uimm32:
			
 
				 
			
 
				 uimm32
			
 
				 ------
			
 
				 
			
 
				-A 32-bit positive :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				-The value is stored as a separate 32-bit dword in the instruction stream.
			
 
				+A 32-bit :ref:`integer number<amdgpu_synid_integer_number>`
			
 
				+or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+The value must be in the range 0..0xFFFFFFFF.
			
 
				 
			
 
				 .. _amdgpu_synid_uimm20:
			
 
				 
			
 
				 uimm20
			
 
				 ------
			
 
				 
			
 
				-A 20-bit positive :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				+A 20-bit :ref:`integer number<amdgpu_synid_integer_number>`
			
 
				+or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				+The value must be in the range 0..0xFFFFF.
			
 
				 
			
 
				 .. _amdgpu_synid_uimm21:
			
 
				 
			
 
				 uimm21
			
 
				 ------
			
 
				 
			
 
				-A 21-bit positive :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				+A 21-bit :ref:`integer number<amdgpu_synid_integer_number>`
			
 
				+or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				+The value must be in the range 0..0x1FFFFF.
			
 
				 
			
 
				 .. WARNING:: Assembler currently supports 20-bit offsets only. Use :ref:`uimm20<amdgpu_synid_uimm20>` as a replacement.
			
 
				 
			
@@ -649,7 +657,10 @@ A 21-bit positive :ref:`integer number<amdgpu_synid_integer_number>`.
 
				 simm21
			
 
				 ------
			
 
				 
			
 
				-A 21-bit :ref:`integer number<amdgpu_synid_integer_number>`.
			
 
				+A 21-bit :ref:`integer number<amdgpu_synid_integer_number>`
			
 
				+or an :ref:`absolute expression<amdgpu_synid_absolute_expression>`.
			
 
				+
			
 
				+The value must be in the range -0x100000..0x0FFFFF.
			
 
				 
			
 
				 .. WARNING:: Assembler currently supports 20-bit unsigned offsets only. Use :ref:`uimm20<amdgpu_synid_uimm20>` as a replacement.
			
 
				 
			
@@ -678,27 +689,20 @@ Integer Numbers
 
				 ---------------
			
 
				 
			
 
				 Integer numbers are 64 bits wide.
			
 
				-They may be specified in binary, octal, hexadecimal and decimal formats:
			
 
				-
			
 
				-    ============== ====================================
			
 
				-    Format         Syntax
			
 
				-    ============== ====================================
			
 
				-    Decimal        [-]?[1-9][0-9]*
			
 
				-    Binary         [-]?0b[01]+
			
 
				-    Octal          [-]?0[0-7]+
			
 
				-    Hexadecimal    [-]?0x[0-9a-fA-F]+
			
 
				-    \              [-]?[0x]?[0-9][0-9a-fA-F]*[hH]
			
 
				-    ============== ====================================
			
 
				+They are converted to :ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				+as described :ref:`here<amdgpu_synid_int_conv>`.
			
 
				 
			
 
				-Examples:
			
 
				+Integer numbers may be specified in binary, octal, hexadecimal and decimal formats:
			
 
				 
			
 
				-.. parsed-literal::
			
 
				-
			
 
				-  -1234
			
 
				-  0b1010
			
 
				-  010
			
 
				-  0xff
			
 
				-  0ffh
			
 
				+    ============ =============================== ========
			
 
				+    Format       Syntax                          Example
			
 
				+    ============ =============================== ========
			
 
				+    Decimal      [-]?[1-9][0-9]*                 -1234
			
 
				+    Binary       [-]?0b[01]+                     0b1010
			
 
				+    Octal        [-]?0[0-7]+                     010
			
 
				+    Hexadecimal  [-]?0x[0-9a-fA-F]+              0xff
			
 
				+    \            [-]?[0x]?[0-9][0-9a-fA-F]*[hH]  0ffh
			
 
				+    ============ =============================== ========
			
 
				 
			
 
				 .. _amdgpu_synid_floating-point_number:
			
 
				 
			
@@ -706,31 +710,29 @@ Floating-Point Numbers
 
				 ----------------------
			
 
				 
			
 
				 All floating-point numbers are handled as double (64 bits wide).
			
 
				+They are converted to
			
 
				+:ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				+as described :ref:`here<amdgpu_synid_fp_conv>`.
			
 
				 
			
 
				 Floating-point numbers may be specified in hexadecimal and decimal formats:
			
 
				 
			
 
				-    ============== ======================================================== ========================================================
			
 
				-    Format         Syntax                                                   Note
			
 
				-    ============== ======================================================== ========================================================
			
 
				-    Decimal        [-]?[0-9]*[.][0-9]*([eE][+-]?[0-9]*)?                    Must include either a decimal separator or an exponent.
			
 
				-    Hexadecimal    [-]0x[0-9a-fA-F]*(.[0-9a-fA-F]*)?[pP][+-]?[0-9a-fA-F]+
			
 
				-    ============== ======================================================== ========================================================
			
 
				-
			
 
				-Examples:
			
 
				-
			
 
				-.. parsed-literal::
			
 
				-
			
 
				- -1.234
			
 
				- 234e2
			
 
				- -0x1afp-10
			
 
				- 0x.1afp10
			
 
				+    ============ ======================================================== ====================== ====================
			
 
				+    Format       Syntax                                                   Examples               Note
			
 
				+    ============ ======================================================== ====================== ====================
			
 
				+    Decimal      [-]?[0-9]*[.][0-9]*([eE][+-]?[0-9]*)?                    -1.234, 234e2          Must include either
			
 
				+                                                                                                 a decimal separator
			
 
				+                                                                                                 or an exponent.
			
 
				+    Hexadecimal  [-]0x[0-9a-fA-F]*(.[0-9a-fA-F]*)?[pP][+-]?[0-9a-fA-F]+   -0x1afp-10, 0x.1afp10
			
 
				+    ============ ======================================================== ====================== ====================
			
 
				 
			
 
				 .. _amdgpu_synid_expression:
			
 
				 
			
 
				 Expressions
			
 
				 ===========
			
 
				 
			
 
				-An expression specifies an address or a numeric value.
			
 
				+An expression is evaluated to a 64-bit integer.
			
 
				+Note that floating-point expressions are not supported.
			
 
				+
			
 
				 There are two kinds of expressions:
			
 
				 
			
 
				 * :ref:`Absolute<amdgpu_synid_absolute_expression>`.
			
@@ -741,10 +743,14 @@ There are two kinds of expressions:
 
				 Absolute Expressions
			
 
				 --------------------
			
 
				 
			
 
				-The value of an absolute expression remains the same after program relocation.
			
 
				+The value of an absolute expression does not change after program relocation.
			
 
				 Absolute expressions must not include unassigned and relocatable values
			
 
				 such as labels.
			
 
				 
			
 
				+Absolute expressions are evaluated to 64-bit integer values and converted to
			
 
				+:ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				+as described :ref:`here<amdgpu_synid_int_conv>`.
			
 
				+
			
 
				 Examples:
			
 
				 
			
 
				 .. parsed-literal::
			
@@ -760,45 +766,38 @@ Relocatable Expressions
 
				 The value of a relocatable expression depends on program relocation.
			
 
				 
			
 
				 Note that use of relocatable expressions is limited with branch targets
			
 
				-and 32-bit :ref:`literals<amdgpu_synid_literal>`.
			
 
				+and 32-bit integer operands.
			
 
				 
			
 
				-Addition information about relocation may be found :ref:`here<amdgpu-relocation-records>`.
			
 
				-
			
 
				-Examples:
			
 
				+A relocatable expression is evaluated to a 64-bit integer value
			
 
				+which depends on operand kind and :ref:`relocation type<amdgpu-relocation-records>`
			
 
				+of symbol(s) used in the expression. For example, if an instruction refers a label,
			
 
				+this reference is evaluated to an offset from the address after the instruction
			
 
				+to the label address:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    y = x + 10 // x is not yet defined. Undefined symbols are assumed to be PC-relative.
			
 
				-    z = .
			
 
				-
			
 
				-Expression Data Type
			
 
				---------------------
			
 
				-
			
 
				-Expressions and operands of expressions are interpreted as 64-bit integers.
			
 
				+    label:
			
 
				+    v_add_co_u32_e32 v0, vcc, label, v1  // 'label' operand is evaluated to -4
			
 
				 
			
 
				-Expressions may include 64-bit :ref:`floating-point numbers<amdgpu_synid_floating-point_number>` (double).
			
 
				-However these operands are also handled as 64-bit integers
			
 
				-using binary representation of specified floating-point numbers.
			
 
				-No conversion from floating-point to integer is performed.
			
 
				-
			
 
				-Examples:
			
 
				+Note that values of relocatable expressions are usually unknown at assembly time;
			
 
				+they are resolved later by a linker and converted to
			
 
				+:ref:`expected operand type<amdgpu_syn_instruction_type>`
			
 
				+as described :ref:`here<amdgpu_synid_rl_conv>`.
			
 
				 
			
 
				-.. parsed-literal::
			
 
				+Operands and Operations
			
 
				+-----------------------
			
 
				 
			
 
				-    x = 0.1    // x is assigned an integer 4591870180066957722 which is a binary representation of 0.1.
			
 
				-    y = x + x  // y is a sum of two integer values; it is not equal to 0.2!
			
 
				+Expressions are composed of 64-bit integer operands and operations.
			
 
				+Operands include :ref:`integer numbers<amdgpu_synid_integer_number>`
			
 
				+and :ref:`symbols<amdgpu_synid_symbol>`.
			
 
				 
			
 
				-Syntax
			
 
				-------
			
 
				+Expressions may also use "." which is a reference to the current PC (program counter).
			
 
				 
			
 
				-Expressions are composed of
			
 
				-:ref:`symbols<amdgpu_synid_symbol>`,
			
 
				-:ref:`integer numbers<amdgpu_synid_integer_number>`,
			
 
				-:ref:`floating-point numbers<amdgpu_synid_floating-point_number>`,
			
 
				-:ref:`binary operators<amdgpu_synid_expression_bin_op>`,
			
 
				-:ref:`unary operators<amdgpu_synid_expression_un_op>` and subexpressions.
			
 
				+:ref:`Unary<amdgpu_synid_expression_un_op>` and :ref:`binary<amdgpu_synid_expression_bin_op>`
			
 
				+operations produce 64-bit integer results.
			
 
				 
			
 
				-Expressions may also use "." which is a reference to the current PC (program counter).
			
 
				+Syntax of Expressions
			
 
				+---------------------
			
 
				 
			
 
				 The syntax of expressions is shown below::
			
 
				 
			
@@ -887,7 +886,7 @@ They operate on and produce 64-bit integers.
 
				 Symbols
			
 
				 -------
			
 
				 
			
 
				-A symbol is a named 64-bit value, representing a relocatable
			
 
				+A symbol is a named 64-bit integer value, representing a relocatable
			
 
				 address or an absolute (non-relocatable) number.
			
 
				 
			
 
				 Symbol names have the following syntax:
			
@@ -907,128 +906,78 @@ The table below provides several examples of syntax used for symbol definition.
 
				 A symbol may be used before it is declared or assigned;
			
 
				 unassigned symbols are assumed to be PC-relative.
			
 
				 
			
 
				-Addition information about symbols may be found :ref:`here<amdgpu-symbols>`.
			
 
				+Additional information about symbols may be found :ref:`here<amdgpu-symbols>`.
			
 
				 
			
 
				 .. _amdgpu_synid_conv:
			
 
				 
			
 
				-Conversions
			
 
				-===========
			
 
				+Type and Size Conversion
			
 
				+========================
			
 
				 
			
 
				 This section describes what happens when a 64-bit
			
 
				 :ref:`integer number<amdgpu_synid_integer_number>`, a
			
 
				-:ref:`floating-point numbers<amdgpu_synid_floating-point_number>` or a
			
 
				-:ref:`symbol<amdgpu_synid_symbol>`
			
 
				+:ref:`floating-point number<amdgpu_synid_floating-point_number>` or an
			
 
				+:ref:`expression<amdgpu_synid_expression>`
			
 
				 is used for an operand which has a different type or size.
			
 
				 
			
 
				-Depending on operand kind, this conversion is performed by either assembler or AMDGPU H/W:
			
 
				-
			
 
				-* Values encoded as :ref:`inline constants<amdgpu_synid_constant>` are handled by H/W.
			
 
				-* Values encoded as :ref:`literals<amdgpu_synid_literal>` are converted by assembler.
			
 
				-
			
 
				-.. _amdgpu_synid_const_conv:
			
 
				-
			
 
				-Inline Constants
			
 
				-----------------
			
 
				-
			
 
				-.. _amdgpu_synid_int_const_conv:
			
 
				-
			
 
				-Integer Inline Constants
			
 
				-~~~~~~~~~~~~~~~~~~~~~~~~
			
 
				-
			
 
				-Integer :ref:`inline constants<amdgpu_synid_constant>`
			
 
				-may be thought of as 64-bit
			
 
				-:ref:`integer numbers<amdgpu_synid_integer_number>`;
			
 
				-when used as operands they are truncated to the size of
			
 
				-:ref:`expected operand type<amdgpu_syn_instruction_type>`.
			
 
				-No data type conversions are performed.
			
 
				-
			
 
				-Examples:
			
 
				-
			
 
				-.. parsed-literal::
			
 
				-
			
 
				-    // GFX9
			
 
				-
			
 
				-    v_add_u16 v0, -1, 0    // v0 = 0xFFFF
			
 
				-    v_add_f16 v0, -1, 0    // v0 = 0xFFFF (NaN)
			
 
				-
			
 
				-    v_add_u32 v0, -1, 0    // v0 = 0xFFFFFFFF
			
 
				-    v_add_f32 v0, -1, 0    // v0 = 0xFFFFFFFF (NaN)
			
 
				+.. _amdgpu_synid_int_conv:
			
 
				 
			
 
				-.. _amdgpu_synid_fp_const_conv:
			
 
				+Conversion of Integer Values
			
 
				+----------------------------
			
 
				 
			
 
				-Floating-Point Inline Constants
			
 
				-~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
			
 
				+Instruction operands may be specified as 64-bit :ref:`integer numbers<amdgpu_synid_integer_number>` or
			
 
				+:ref:`absolute expressions<amdgpu_synid_absolute_expression>`. These values are converted to
			
 
				+the :ref:`expected operand type<amdgpu_syn_instruction_type>` using the following steps:
			
 
				 
			
 
				-Floating-point :ref:`inline constants<amdgpu_synid_constant>`
			
 
				-may be thought of as 64-bit
			
 
				-:ref:`floating-point numbers<amdgpu_synid_floating-point_number>`;
			
 
				-when used as operands they are converted to a floating-point number of
			
 
				-:ref:`expected operand size<amdgpu_syn_instruction_type>`.
			
 
				+1. *Validation*. Assembler checks if the input value may be truncated without loss to the required *truncation width*
			
 
				+(see the table below). There are two cases when this operation is enabled:
			
 
				 
			
 
				-Examples:
			
 
				-
			
 
				-.. parsed-literal::
			
 
				-
			
 
				-    // GFX9
			
 
				-
			
 
				-    v_add_f16 v0, 1.0, 0    // v0 = 0x3C00 (1.0)
			
 
				-    v_add_u16 v0, 1.0, 0    // v0 = 0x3C00
			
 
				-
			
 
				-    v_add_f32 v0, 1.0, 0    // v0 = 0x3F800000 (1.0)
			
 
				-    v_add_u32 v0, 1.0, 0    // v0 = 0x3F800000
			
 
				-
			
 
				-
			
 
				-.. _amdgpu_synid_lit_conv:
			
 
				-
			
 
				-Literals
			
 
				---------
			
 
				+    * The truncated bits are all 0.
			
 
				+    * The truncated bits are all 1 and the value after truncation has its MSB bit set.
			
 
				 
			
 
				-.. _amdgpu_synid_int_lit_conv:
			
 
				+In all other cases assembler triggers an error.
			
 
				 
			
 
				-Integer Literals
			
 
				-~~~~~~~~~~~~~~~~
			
 
				+2. *Conversion*. The input value is converted to the expected type as described in the table below.
			
 
				+Depending on operand kind, this conversion is performed by either assembler or AMDGPU H/W (or both).
			
 
				 
			
 
				-Integer :ref:`literals<amdgpu_synid_literal>`
			
 
				-are specified as 64-bit :ref:`integer numbers<amdgpu_synid_integer_number>`.
			
 
				+    ============== ================= =============== ====================================================================
			
 
				+    Expected type  Truncation Width  Conversion      Description
			
 
				+    ============== ================= =============== ====================================================================
			
 
				+    i16, u16, b16  16                num.u16         Truncate to 16 bits.
			
 
				+    i32, u32, b32  32                num.u32         Truncate to 32 bits.
			
 
				+    i64            32                {-1,num.i32}    Truncate to 32 bits and then sign-extend the result to 64 bits.
			
 
				+    u64, b64       32                {0,num.u32}     Truncate to 32 bits and then zero-extend the result to 64 bits.
			
 
				+    f16            16                num.u16         Use low 16 bits as an f16 value.
			
 
				+    f32            32                num.u32         Use low 32 bits as an f32 value.
			
 
				+    f64            32                {num.u32,0}     Use low 32 bits of the number as high 32 bits
			
 
				+                                                     of the result; low 32 bits of the result are zeroed.
			
 
				+    ============== ================= =============== ====================================================================
			
 
				 
			
 
				-When used as operands they are converted to
			
 
				-:ref:`expected operand type<amdgpu_syn_instruction_type>` as described below.
			
 
				-
			
 
				-    ============== ============== =============== ====================================================================
			
 
				-    Expected type  Condition      Result          Note
			
 
				-    ============== ============== =============== ====================================================================
			
 
				-    i16, u16, b16  cond(num,16)   num.u16         Truncate to 16 bits.
			
 
				-    i32, u32, b32  cond(num,32)   num.u32         Truncate to 32 bits.
			
 
				-    i64            cond(num,32)   {-1,num.i32}    Truncate to 32 bits and then sign-extend the result to 64 bits.
			
 
				-    u64, b64       cond(num,32)   { 0,num.u32}    Truncate to 32 bits and then zero-extend the result to 64 bits.
			
 
				-    f16            cond(num,16)   num.u16         Use low 16 bits as an f16 value.
			
 
				-    f32            cond(num,32)   num.u32         Use low 32 bits as an f32 value.
			
 
				-    f64            cond(num,32)   {num.u32,0}     Use low 32 bits of the number as high 32 bits
			
 
				-                                                  of the result; low 32 bits of the result are zeroed.
			
 
				-    ============== ============== =============== ====================================================================
			
 
				-
			
 
				-The condition *cond(X,S)* indicates if a 64-bit number *X*
			
 
				-can be converted to a smaller size *S* by truncation of upper bits.
			
 
				-There are two cases when the conversion is possible:
			
 
				-
			
 
				-* The truncated bits are all 0.
			
 
				-* The truncated bits are all 1 and the value after truncation has its MSB bit set.
			
 
				-
			
 
				-Examples of valid literals:
			
 
				+Examples of enabled conversions:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				     // GFX9
			
 
				-                                             // Literal value after conversion:
			
 
				-    v_add_u16 v0, 0xff00, v0                 //   0xff00
			
 
				-    v_add_u16 v0, 0xffffffffffffff00, v0     //   0xff00
			
 
				-    v_add_u16 v0, -256, v0                   //   0xff00
			
 
				-                                             // Literal value after conversion:
			
 
				-    s_bfe_i64 s[0:1], 0xffefffff, s3         //   0xffffffffffefffff
			
 
				-    s_bfe_u64 s[0:1], 0xffefffff, s3         //   0x00000000ffefffff
			
 
				-    v_ceil_f64_e32 v[0:1], 0xffefffff        //   0xffefffff00000000 (-1.7976922776554302e308)
			
 
				 
			
 
				-Examples of invalid literals:
			
 
				+    v_add_u16 v0, -1, 0                   // src0 = 0xFFFF
			
 
				+    v_add_f16 v0, -1, 0                   // src0 = 0xFFFF (NaN)
			
 
				+                                          //
			
 
				+    v_add_u32 v0, -1, 0                   // src0 = 0xFFFFFFFF
			
 
				+    v_add_f32 v0, -1, 0                   // src0 = 0xFFFFFFFF (NaN)
			
 
				+                                          //
			
 
				+    v_add_u16 v0, 0xff00, v0              // src0 = 0xff00
			
 
				+    v_add_u16 v0, 0xffffffffffffff00, v0  // src0 = 0xff00
			
 
				+    v_add_u16 v0, -256, v0                // src0 = 0xff00
			
 
				+                                          //
			
 
				+    s_bfe_i64 s[0:1], 0xffefffff, s3      // src0 = 0xffffffffffefffff
			
 
				+    s_bfe_u64 s[0:1], 0xffefffff, s3      // src0 = 0x00000000ffefffff
			
 
				+    v_ceil_f64_e32 v[0:1], 0xffefffff     // src0 = 0xffefffff00000000 (-1.7976922776554302e308)
			
 
				+                                          //
			
 
				+    x = 0xffefffff                        //
			
 
				+    s_bfe_i64 s[0:1], x, s3               // src0 = 0xffffffffffefffff
			
 
				+    s_bfe_u64 s[0:1], x, s3               // src0 = 0x00000000ffefffff
			
 
				+    v_ceil_f64_e32 v[0:1], x              // src0 = 0xffefffff00000000 (-1.7976922776554302e308)
			
 
				+
			
 
				+Examples of disabled conversions:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
@@ -1037,49 +986,57 @@ Examples of invalid literals:
 
				     v_add_u16 v0, 0x1ff00, v0               // truncated bits are not all 0 or 1
			
 
				     v_add_u16 v0, 0xffffffffffff00ff, v0    // truncated bits do not match MSB of the result
			
 
				 
			
 
				-.. _amdgpu_synid_fp_lit_conv:
			
 
				+.. _amdgpu_synid_fp_conv:
			
 
				 
			
 
				-Floating-Point Literals
			
 
				-~~~~~~~~~~~~~~~~~~~~~~~
			
 
				+Conversion of Floating-Point Values
			
 
				+-----------------------------------
			
 
				 
			
 
				-Floating-point :ref:`literals<amdgpu_synid_literal>` are specified as 64-bit
			
 
				-:ref:`floating-point numbers<amdgpu_synid_floating-point_number>`.
			
 
				+Instruction operands may be specified as 64-bit :ref:`floating-point numbers<amdgpu_synid_floating-point_number>`.
			
 
				+These values are converted to the :ref:`expected operand type<amdgpu_syn_instruction_type>` using the following steps:
			
 
				 
			
 
				-When used as operands they are converted to
			
 
				-:ref:`expected operand type<amdgpu_syn_instruction_type>` as described below.
			
 
				+1. *Validation*. Assembler checks if the input f64 number can be converted
			
 
				+to the *required floating-point type* (see the table below) without overflow or underflow.
			
 
				+Precision lost is allowed. If this conversion is not possible, assembler triggers an error.
			
 
				 
			
 
				-    ============== ============== ================= =================================================================
			
 
				-    Expected type  Condition      Result            Note
			
 
				-    ============== ============== ================= =================================================================
			
 
				-    i16, u16, b16  cond(num,16)   f16(num)          Convert to f16 and use bits of the result as an integer value.
			
 
				-    i32, u32, b32  cond(num,32)   f32(num)          Convert to f32 and use bits of the result as an integer value.
			
 
				-    i64, u64, b64  false          \-                Conversion disabled because of an unclear semantics.
			
 
				-    f16            cond(num,16)   f16(num)          Convert to f16.
			
 
				-    f32            cond(num,32)   f32(num)          Convert to f32.
			
 
				-    f64            true           {num.u32.hi,0}    Use high 32 bits of the number as high 32 bits of the result;
			
 
				-                                                    zero-fill low 32 bits of the result.
			
 
				+2. *Conversion*. The input value is converted to the expected type as described in the table below.
			
 
				+Depending on operand kind, this is performed by either assembler or AMDGPU H/W (or both).
			
 
				 
			
 
				-                                                    Note that the result may differ from the original number.
			
 
				-    ============== ============== ================= =================================================================
			
 
				+    ============== ================ ================= =================================================================
			
 
				+    Expected type  Required FP Type Conversion        Description
			
 
				+    ============== ================ ================= =================================================================
			
 
				+    i16, u16, b16  f16              f16(num)          Convert to f16 and use bits of the result as an integer value.
			
 
				+    i32, u32, b32  f32              f32(num)          Convert to f32 and use bits of the result as an integer value.
			
 
				+    i64, u64, b64  \-               \-                Conversion disabled.
			
 
				+    f16            f16              f16(num)          Convert to f16.
			
 
				+    f32            f32              f32(num)          Convert to f32.
			
 
				+    f64            f64              {num.u32.hi,0}    Use high 32 bits of the number as high 32 bits of the result;
			
 
				+                                                      zero-fill low 32 bits of the result.
			
 
				 
			
 
				-The condition *cond(X,S)* indicates if an f64 number *X* can be converted
			
 
				-to a smaller *S*-bit floating-point type without overflow or underflow.
			
 
				-Precision lost is allowed.
			
 
				+                                                      Note that the result may differ from the original number.
			
 
				+    ============== ================ ================= =================================================================
			
 
				 
			
 
				-Examples of valid literals:
			
 
				+Examples of enabled conversions:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				     // GFX9
			
 
				 
			
 
				-    v_add_f16 v1, 65500.0, v2
			
 
				-    v_add_f32 v1, 65600.0, v2
			
 
				+    v_add_f16 v0, 1.0, 0        // src0 = 0x3C00 (1.0)
			
 
				+    v_add_u16 v0, 1.0, 0        // src0 = 0x3C00
			
 
				+                                //
			
 
				+    v_add_f32 v0, 1.0, 0        // src0 = 0x3F800000 (1.0)
			
 
				+    v_add_u32 v0, 1.0, 0        // src0 = 0x3F800000
			
 
				 
			
 
				-    // Literal value before conversion: 1.7976931348623157e308 (0x7fefffffffffffff)
			
 
				-    // Literal value after conversion:  1.7976922776554302e308 (0x7fefffff00000000)
			
 
				+                                // src0 before conversion:
			
 
				+                                //   1.7976931348623157e308 = 0x7fefffffffffffff
			
 
				+                                // src0 after conversion:
			
 
				+                                //   1.7976922776554302e308 = 0x7fefffff00000000
			
 
				     v_ceil_f64 v[0:1], 1.7976931348623157e308
			
 
				 
			
 
				-Examples of invalid literals:
			
 
				+    v_add_f16 v1, 65500.0, v2   // ok for f16.
			
 
				+    v_add_f32 v1, 65600.0, v2   // ok for f32, but would result in overflow for f16.
			
 
				+
			
 
				+Examples of disabled conversions:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
@@ -1087,25 +1044,35 @@ Examples of invalid literals:
 
				 
			
 
				     v_add_f16 v1, 65600.0, v2    // overflow
			
 
				 
			
 
				-.. _amdgpu_synid_exp_conv:
			
 
				+.. _amdgpu_synid_rl_conv:
			
 
				 
			
 
				-Expressions
			
 
				-~~~~~~~~~~~
			
 
				+Conversion of Relocatable Values
			
 
				+--------------------------------
			
 
				 
			
 
				-Expressions operate with and result in 64-bit integers.
			
 
				+:ref:`Relocatable expressions<amdgpu_synid_relocatable_expression>`
			
 
				+may be used with 32-bit integer operands and jump targets.
			
 
				 
			
 
				-When used as operands they are truncated to
			
 
				-:ref:`expected operand size<amdgpu_syn_instruction_type>`.
			
 
				-No data type conversions are performed.
			
 
				+When the value of a relocatable expression is resolved by a linker, it is
			
 
				+converted as needed and truncated to the operand size. The conversion depends
			
 
				+on :ref:`relocation type<amdgpu-relocation-records>` and operand kind.
			
 
				 
			
 
				-Examples:
			
 
				+For example, when a 32-bit operand of an instruction refers a relocatable expression *expr*,
			
 
				+this reference is evaluated to a 64-bit offset from the address after the
			
 
				+instruction to the address being referenced, *counted in bytes*.
			
 
				+Then the value is truncated to 32 bits and encoded as a literal:
			
 
				 
			
 
				 .. parsed-literal::
			
 
				 
			
 
				-    // GFX9
			
 
				+    expr = .
			
 
				+    v_add_co_u32_e32 v0, vcc, expr, v1  // 'expr' operand is evaluated to -4
			
 
				+                                        // and then truncated to 0xFFFFFFFC
			
 
				 
			
 
				-    x = 0.1
			
 
				-    v_sqrt_f32 v0, x           // v0 = [low 32 bits of 0.1 (double)]
			
 
				-    v_sqrt_f32 v0, (0.1 + 0)   // the same as above
			
 
				-    v_sqrt_f32 v0, 0.1         // v0 = [0.1 (double) converted to float]
			
 
				+As another example, when a branch instruction refers a label,
			
 
				+this reference is evaluated to an offset from the address after the
			
 
				+instruction to the label address, *counted in dwords*.
			
 
				+Then the value is truncated to 16 bits:
			
 
				+
			
 
				+.. parsed-literal::
			
 
				 
			
 
				+    label:
			
 
				+    s_branch label  // 'label' operand is evaluated to -1 and truncated to 0xFFFF