diff --git a/src/panfrost/compiler/bifrost/valhall/ISA.xml b/src/panfrost/compiler/bifrost/valhall/ISA.xml
index 3eceeb8f7bd..e40298edb3d 100644
--- a/src/panfrost/compiler/bifrost/valhall/ISA.xml
+++ b/src/panfrost/compiler/bifrost/valhall/ISA.xml
@@ -1,5 +1,6 @@
 <!--
   Copyright (C) 2021 Collabora Ltd.
+  Copyright (C) 2026 Arm Ltd.
   SPDX-License-Identifier: MIT
 -->
 
@@ -790,7 +791,8 @@
        instruction isn't generated yet, but it may also be because there
        is a duplicate instruction in the Bifrost or pseudo XML files
   -->
-  <ins name="NOP" title="No operation" dests="0" opcode="0x00" unused="true" unit="CVT">
+  <ins name="NOP" title="No operation" dests="0" unused="true" unit="CVT">
+    <opcode val="0x00" start="48" mask="0x1FF"/>
     <desc>
       Do nothing. Useful at the start of a block for waiting on slots required
       by the first actual instruction of the block, to reconcile dependencies
@@ -798,7 +800,8 @@
     </desc>
   </ins>
 
-  <ins name="BRANCHZ" title="Compare to zero and branch" dests="0" opcode="0x1F" unused="true" unit="CVT">
+  <ins name="BRANCHZ" title="Compare to zero and branch" dests="0" unused="true" unit="CVT">
+    <opcode val="0x1F" start="48" mask="0x1FF"/>
     <desc>
       Branches to a specified relative offset if its source is nonzero (default)
       or if its source is zero (if `.eq` is set). The offset is 27-bits and
@@ -820,7 +823,8 @@
     <va_mod name="eq" start="36" size="1"/>
   </ins>
 
-  <ins name="DISCARD.f32" title="Discard fragment" dests="0" opcode="0x20" unused="true" unit="CVT">
+  <ins name="DISCARD.f32" title="Discard fragment" dests="0" unused="true" unit="CVT">
+    <opcode val="0x20" start="48" mask="0x1FF"/>
     <desc>
       Evaluates the given condition, and if it passes, discards the current
       fragment and terminates the thread. Only valid in a **fragment** shader.
@@ -830,7 +834,8 @@
     <src absneg="true" swizzle="true">Right value to compare</src>
   </ins>
 
-  <ins name="BRANCHZI" title="Compare to zero and branch indirect" opcode="0x2F" dests="0" last="true" unit="CVT">
+  <ins name="BRANCHZI" title="Compare to zero and branch indirect" dests="0" last="true" unit="CVT">
+    <opcode val="0x2F" start="48" mask="0x1FF"/>
     <desc>
       Jump to an indirectly specified (absolute or relative) address. Used to
       jump to blend shaders at the end of a fragment shader.
@@ -842,7 +847,8 @@
     <va_mod name="absolute" start="40" size="1"/>
   </ins>
 
-  <ins name="BARRIER" title="Execution and memory barrier" opcode="0x45" unused="true" unit="NONE">
+  <ins name="BARRIER" title="Execution and memory barrier" unused="true" unit="NONE">
+    <opcode val="0x45" start="48" mask="0x1FF"/>
     <desc>
       General-purpose barrier. Must use slot #7. Must be paired with a
       `.wait` flow on the instruction.
@@ -851,8 +857,12 @@
   </ins>
 
   <group name="CSEL" title="Floating-point conditional select" dests="1" unused="true" unit="CVT">
-    <ins name="CSEL.f32" opcode="0x154"/>
-    <ins name="CSEL.v2f16" opcode="0x155"/>
+    <ins name="CSEL.f32">
+      <opcode val="0x154" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="CSEL.v2f16">
+      <opcode val="0x155" start="48" mask="0x1FF"/>
+    </ins>
     <desc>
       Evaluates the given condition and outputs either the true source or the
       false source.
@@ -865,10 +875,18 @@
   </group>
 
   <group name="CSEL" title="Integer conditional select" dests="1" unused="true" unit="CVT">
-    <ins name="CSEL.u32" opcode="0x150"/>
-    <ins name="CSEL.v2u16" opcode="0x151"/>
-    <ins name="CSEL.s32" opcode="0x158"/>
-    <ins name="CSEL.v2s16" opcode="0x159"/>
+    <ins name="CSEL.u32">
+      <opcode val="0x150" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="CSEL.v2u16">
+      <opcode val="0x151" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="CSEL.s32">
+      <opcode val="0x158" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="CSEL.v2s16">
+      <opcode val="0x159" start="48" mask="0x1FF"/>
+    </ins>
     <desc>
       Evaluates the given condition and outputs either the true source or the
       false source.
@@ -885,7 +903,8 @@
     <src>Return value if false</src>
   </group>
 
-  <ins name="LD_VAR_SPECIAL" title="Load special varying" opcode="0x56" unused="true" unit="V">
+  <ins name="LD_VAR_SPECIAL" title="Load special varying" unused="true" unit="V">
+    <opcode val="0x56" start="48" mask="0x1FF"/>
     <sr write="true"/>
     <sr_count/>
     <vecsize/>
@@ -899,8 +918,12 @@
 
   <group name="LD_VAR_BUF_IMM" title="Load immediate varying" message="varying" unit="V">
     <desc>Interpolates a given varying from hardware buffer</desc>
-    <ins name="LD_VAR_BUF_IMM.f32" opcode="0x5C"/>
-    <ins name="LD_VAR_BUF_IMM.f16" opcode="0x5D"/>
+    <ins name="LD_VAR_BUF_IMM.f32">
+      <opcode val="0x5C" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LD_VAR_BUF_IMM.f16">
+      <opcode val="0x5D" start="48" mask="0x1FF"/>
+    </ins>
     <slot/>
     <vecsize/>
     <source_format/>
@@ -915,8 +938,12 @@
 
   <group name="LD_VAR_BUF" title="Load indirect varying" message="varying" unit="V">
     <desc>Interpolates a given varying from hardware buffer</desc>
-    <ins name="LD_VAR_BUF.f32" opcode="0x6C"/>
-    <ins name="LD_VAR_BUF.f16" opcode="0x6D"/>
+    <ins name="LD_VAR_BUF.f32">
+      <opcode val="0x6C" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LD_VAR_BUF.f16">
+      <opcode val="0x6D" start="48" mask="0x1FF"/>
+    </ins>
     <slot/>
     <vecsize/>
     <source_format/>
@@ -929,7 +956,8 @@
     <src/>
   </group>
 
-  <ins name="LD_VAR" title="Load indirect varying" unused="true" unit="V" opcode="0x64">
+  <ins name="LD_VAR" title="Load indirect varying" unused="true" unit="V">
+    <opcode val="0x64" start="48" mask="0x1FF"/>
     <desc>Interpolates a given varying from a software buffer</desc>
     <slot/>
     <vecsize/>
@@ -942,7 +970,8 @@
     <src>Varying index and table</src>
   </ins>
 
-  <ins name="LD_VAR_IMM" title="Load immediate varying" unused="true" unit="V" opcode="0x54">
+  <ins name="LD_VAR_IMM" title="Load immediate varying" unused="true" unit="V">
+    <opcode val="0x54" start="48" mask="0x1FF"/>
     <desc>Interpolates a given varying from a software buffer</desc>
     <slot/>
     <vecsize/>
@@ -956,7 +985,8 @@
     <imm name="index" start="12" size="8"/>
   </ins>
 
-  <ins name="LD_VAR_FLAT" title="Load indirect varying" unused="true" unit="V" opcode="0x55">
+  <ins name="LD_VAR_FLAT" title="Load indirect varying" unused="true" unit="V">
+    <opcode val="0x55" start="48" mask="0x1FF"/>
     <desc>Fetches a given varying from a software buffer</desc>
     <slot/>
     <vecsize/>
@@ -966,7 +996,8 @@
     <src>Varying index and table</src>
   </ins>
 
-  <ins name="LD_VAR_FLAT_IMM" title="Load immediate varying" unused="true" unit="V" opcode="0x41">
+  <ins name="LD_VAR_FLAT_IMM" title="Load immediate varying" unused="true" unit="V">
+    <opcode val="0x41" start="48" mask="0x1FF"/>
     <desc>Fetches a given varying from a software buffer</desc>
     <slot/>
     <vecsize/>
@@ -977,7 +1008,8 @@
     <imm name="index" start="12" size="8"/>
   </ins>
 
-  <ins name="LD_ATTR_IMM" title="Load immediate attribute" opcode="0x66" opcode2="0" unused="true" unit="LS">
+  <ins name="LD_ATTR_IMM" title="Load immediate attribute" opcode2="0" unused="true" unit="LS">
+    <opcode val="0x66" start="48" mask="0x1FF"/>
     <desc>
       Load `vecsize` components from the attribute descriptor at entry `index`
       of resource table `table` at index (vertex ID, instance ID), converting
@@ -995,7 +1027,8 @@
     <imm name="table" start="16" size="4"/>
   </ins>
 
-  <ins name="LD_ATTR" title="Load indirect attribute" opcode="0x76" opcode2="0" unused="true" unit="LS">
+  <ins name="LD_ATTR" title="Load indirect attribute" opcode2="0" unused="true" unit="LS">
+    <opcode val="0x76" start="48" mask="0x1FF"/>
     <desc>
       Load `vecsize` components from the attribute descriptor at the specified
       location at index (vertex ID, instance ID), converting
@@ -1014,14 +1047,16 @@
     <src>Index and table</src>
   </ins>
 
-  <ins name="LD_GCLK_U64" title="Global clock load" opcode="0x44" unused="true" unit="LS">
+  <ins name="LD_GCLK_U64" title="Global clock load" unused="true" unit="LS">
+    <opcode val="0x44" start="48" mask="0x1FF"/>
     <desc>Load the 64-bit global clock, either a cycle counter or the system clock.</desc>
     <sr write="true"/>
     <sr_count count="2"/>
     <slot/>
   </ins>
 
-  <ins name="LD_TEX_IMM" title="Load immediate texture" opcode="0x66" opcode2="1" message="attribute" unit="LS">
+  <ins name="LD_TEX_IMM" title="Load immediate texture" opcode2="1" message="attribute" unit="LS">
+    <opcode val="0x66" start="48" mask="0x1FF"/>
     <desc>
       Load `vecsize` components from the texture descriptor at entry `index`
       of resource table `table`, converting
@@ -1039,7 +1074,8 @@
     <imm name="table" ir_name="" start="16" size="4"/>
   </ins>
 
-  <ins name="LD_TEX" title="Load indirect texture" message="attribute" opcode="0x76" opcode2="1" unit="LS">
+  <ins name="LD_TEX" title="Load indirect texture" message="attribute" opcode2="1" unit="LS">
+    <opcode val="0x76" start="48" mask="0x1FF"/>
     <desc>
       Load `vecsize` components from the texture descriptor at the specified
       location at index, converting
@@ -1056,7 +1092,8 @@
     <src>Index and table</src>
   </ins>
 
-  <ins name="LEA_ATTR_IMM" title="Load effective address of image texel" opcode="0x67" opcode2="0" unused="true" unit="LS">
+  <ins name="LEA_ATTR_IMM" title="Load effective address of image texel" opcode2="0" unused="true" unit="LS">
+    <opcode val="0x67" start="48" mask="0x1FF"/>
     <desc>
       Load the effective address of an attribute specified with the
       given immediate index. Returns three staging register: the low/high
@@ -1072,7 +1109,8 @@
     <imm name="index" start="20" size="4"/>
   </ins>
 
-  <ins name="LEA_ATTR" title="Load effective address of image texel" opcode="0x77" opcode2="0" unused="true" unit="LS">
+  <ins name="LEA_ATTR" title="Load effective address of image texel" opcode2="0" unused="true" unit="LS">
+    <opcode val="0x77" start="48" mask="0x1FF"/>
     <desc>
       Load the effective address of an attribute specified with the
       given index. Returns three staging register: the low/high
@@ -1088,7 +1126,8 @@
     <src>Attribute index and table</src>
   </ins>
 
-  <ins name="LEA_TEX_IMM" title="Load effective address of image texel" opcode="0x67" opcode2="1" unused="true" unit="LS">
+  <ins name="LEA_TEX_IMM" title="Load effective address of image texel" opcode2="1" unused="true" unit="LS">
+    <opcode val="0x67" start="48" mask="0x1FF"/>
     <desc>
       Load the effective address of a texel from the image specified with the
       given immediate index. Returns three staging registers: the low/high
@@ -1109,7 +1148,8 @@
     <imm name="index" start="20" size="4"/>
   </ins>
 
-  <ins name="LEA_TEX" title="Load effective address of image texel" opcode="0x77" opcode2="1" unused="true" unit="LS">
+  <ins name="LEA_TEX" title="Load effective address of image texel" opcode2="1" unused="true" unit="LS">
+    <opcode val="0x77" start="48" mask="0x1FF"/>
     <desc>
       Load the effective address of a texel from the image specified with the
       given index. Returns three staging register: the low/high
@@ -1130,7 +1170,8 @@
     <src>Index and table</src>
   </ins>
 
-  <ins name="LD_PKA.i8" title="Global memory load" message="load" opcode="0x6a" opcode2="0" unit="LS">
+  <ins name="LD_PKA.i8" title="Global memory load" message="load" opcode2="0" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1147,7 +1188,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i16" title="Global memory load" message="load" opcode="0x6a" opcode2="1" unit="LS">
+  <ins name="LD_PKA.i16" title="Global memory load" message="load" opcode2="1" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1164,7 +1206,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i24" title="Global memory load" message="load" opcode="0x6a" opcode2="2" unit="LS">
+  <ins name="LD_PKA.i24" title="Global memory load" message="load" opcode2="2" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1181,7 +1224,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i32" title="Global memory load" message="load" opcode="0x6a" opcode2="3" unit="LS">
+  <ins name="LD_PKA.i32" title="Global memory load" message="load" opcode2="3" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1198,7 +1242,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i48" title="Global memory load" message="load" opcode="0x6a" opcode2="4" unit="LS">
+  <ins name="LD_PKA.i48" title="Global memory load" message="load" opcode2="4" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1215,7 +1260,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i64" title="Global memory load" message="load" opcode="0x6a" opcode2="5" unit="LS">
+  <ins name="LD_PKA.i64" title="Global memory load" message="load" opcode2="5" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1232,7 +1278,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i96" title="Global memory load" message="load" opcode="0x6a" opcode2="6" unit="LS">
+  <ins name="LD_PKA.i96" title="Global memory load" message="load" opcode2="6" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1249,7 +1296,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LD_PKA.i128" title="Global memory load" message="load" opcode="0x6a" opcode2="7" unit="LS">
+  <ins name="LD_PKA.i128" title="Global memory load" message="load" opcode2="7" unit="LS">
+    <opcode val="0x6A" start="48" mask="0x1FF"/>
     <desc>
       Loads a buffer descriptor. If bits 25...31 of the mode descriptor are
       all-ones, load from the buffer descriptors in the table indexed by the
@@ -1267,7 +1315,8 @@
   </ins>
 
 
-  <ins name="LEA_BUF" title="Load buffer effective address" message="attribute" opcode="0x6E" unit="LS">
+  <ins name="LEA_BUF" title="Load buffer effective address" message="attribute" unit="LS">
+    <opcode val="0x6E" start="48" mask="0x1FF"/>
     <desc>
       Load effective address of a buffer with an offset added.
     </desc>
@@ -1278,7 +1327,8 @@
     <src size="32">Mode descriptor</src>
   </ins>
 
-  <ins name="LEA_BUF_IMM" title="Load buffer effective address" message="attribute" opcode="0x5E" unit="LS">
+  <ins name="LEA_BUF_IMM" title="Load buffer effective address" message="attribute" unit="LS">
+    <opcode val="0x5E" start="48" mask="0x1FF"/>
     <desc>
       Load effective address of a buffer with an immediate offset added.
     </desc>
@@ -1290,7 +1340,8 @@
     <src size="32">Structure index</src>
   </ins>
 
-  <ins name="LOAD.i8" title="Global memory load" opcode="0x60" opcode2="0" unused="true" unit="LS">
+  <ins name="LOAD.i8" title="Global memory load" opcode2="0" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1302,7 +1353,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i16" title="Global memory load" opcode="0x60" opcode2="1" unused="true" unit="LS">
+  <ins name="LOAD.i16" title="Global memory load" opcode2="1" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1314,7 +1366,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i24" title="Global memory load" opcode="0x60" opcode2="2" unused="true" unit="LS">
+  <ins name="LOAD.i24" title="Global memory load" opcode2="2" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1326,7 +1379,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i32" title="Global memory load" opcode="0x60" opcode2="3" unused="true" unit="LS">
+  <ins name="LOAD.i32" title="Global memory load" opcode2="3" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1338,7 +1392,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i48" title="Global memory load" opcode="0x60" opcode2="4" unused="true" unit="LS">
+  <ins name="LOAD.i48" title="Global memory load" opcode2="4" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1350,7 +1405,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i64" title="Global memory load" opcode="0x60" opcode2="5" unused="true" unit="LS">
+  <ins name="LOAD.i64" title="Global memory load" opcode2="5" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1362,7 +1418,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i96" title="Global memory load" opcode="0x60" opcode2="6" unused="true" unit="LS">
+  <ins name="LOAD.i96" title="Global memory load" opcode2="6" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1374,7 +1431,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <ins name="LOAD.i128" title="Global memory load" opcode="0x60" opcode2="7" unused="true" unit="LS">
+  <ins name="LOAD.i128" title="Global memory load" opcode2="7" unused="true" unit="LS">
+    <opcode val="0x60" start="48" mask="0x1FF"/>
     <desc>Loads from main memory</desc>
     <sr write="true"/>
     <memory_access/>
@@ -1386,7 +1444,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </ins>
 
-  <group name="STORE" title="Global memory store" opcode="0x61" unused="true" unit="LS">
+  <group name="STORE" title="Global memory store" unused="true" unit="LS">
+    <opcode val="0x61" start="48" mask="0x1FF"/>
     <desc>Stores to main memory</desc>
     <sr read="true"/>
     <ins name="STORE.i8" opcode2="0x0"/>
@@ -1404,7 +1463,8 @@
     <imm name="offset" start="8" size="16" signed="true"/>
   </group>
 
-  <ins name="LEA_PKA" title="Load buffer effective address" message="attribute" opcode="0x6B" unit="LS">
+  <ins name="LEA_PKA" title="Load buffer effective address" message="attribute" unit="LS">
+    <opcode val="0x6B" start="48" mask="0x1FF"/>
     <desc>
       Load effective address of a simple buffer with an offset added.
     </desc>
@@ -1415,7 +1475,8 @@
     <src>Index</src>
   </ins>
 
-  <ins name="LD_CVT" title="Load with conversion" opcode="0x70" unused="true" unit="LS">
+  <ins name="LD_CVT" title="Load with conversion" unused="true" unit="LS">
+    <opcode val="0x70" start="48" mask="0x1FF"/>
     <desc>
       Load from memory with data conversion. The address to load from is given in
       the first source, which must be a 64-bit register (a pair of 32-bit
@@ -1432,7 +1493,8 @@
     <src>Internal conversion descriptor</src>
   </ins>
 
-  <ins name="ST_CVT" title="Store with conversion" opcode="0x71" unused="true" unit="LS">
+  <ins name="ST_CVT" title="Store with conversion" unused="true" unit="LS">
+    <opcode val="0x71" start="48" mask="0x1FF"/>
     <desc>
       Store to memory with data conversion. The address to store to is given in
       the first source, which must be a 64-bit register (a pair of 32-bit
@@ -1451,7 +1513,8 @@
     <src>Internal conversion descriptor</src>
   </ins>
 
-  <ins name="LD_TILE" title="Load from tilebuffer" opcode="0x78" unused="true" unit="NONE">
+  <ins name="LD_TILE" title="Load from tilebuffer" unused="true" unit="NONE">
+    <opcode val="0x78" start="48" mask="0x1FF"/>
     <desc>
       Loads a given render target, specified in the pixel indices descriptor, at
       a given location and sample, and convert to the format specified in the
@@ -1468,7 +1531,8 @@
     <src>Conversion descriptor</src>
   </ins>
 
-  <ins name="ST_TILE" title="Store to tilebuffer" opcode="0x79" unused="true" unit="NONE">
+  <ins name="ST_TILE" title="Store to tilebuffer" unused="true" unit="NONE">
+    <opcode val="0x79" start="48" mask="0x1FF"/>
     <desc>
       Store to given render target, specified in the pixel indices descriptor, at
       a given location and sample, and convert to the format specified in the
@@ -1484,7 +1548,8 @@
     <src>Conversion descriptor</src>
   </ins>
 
-  <ins name="BLEND" title="Blend render target" opcode="0x7F" unused="true" unit="NONE">
+  <ins name="BLEND" title="Blend render target" unused="true" unit="NONE">
+    <opcode val="0x7F" start="48" mask="0x1FF"/>
     <desc>
       Blends a given render target. This loads the API-specified blend state for
       the render target from the first source. Blend descriptors are available
@@ -1520,7 +1585,8 @@
     <regfmt/>
   </ins>
 
-  <ins name="ATEST" title="Alpha test" opcode="0x7D" unused="true" unit="NONE">
+  <ins name="ATEST" title="Alpha test" unused="true" unit="NONE">
+    <opcode val="0x7D" start="48" mask="0x1FF"/>
     <desc>
       Does alpha-to-coverage testing, updating the sample coverage mask. ATEST
       does not do an implicit discard. It should be executed before the first
@@ -1533,7 +1599,8 @@
     <sr_count/>
   </ins>
 
-  <ins name="ZS_EMIT" title="Depth/stencil write" opcode="0x7E" unused="true" unit="NONE">
+  <ins name="ZS_EMIT" title="Depth/stencil write" unused="true" unit="NONE">
+    <opcode val="0x7E" start="48" mask="0x1FF"/>
     <desc>
       Programatically writes out depth, stencil, or both, depending on which
       modifiers are set. Used to implement gl_FragDepth and gl_FragStencil.
@@ -1548,7 +1615,8 @@
     <slot/>
   </ins>
 
-  <group name="CONVERT" title="Data conversions" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="CONVERT" title="Data conversions" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>
       Performs the given data conversion. Note that floating-point rounding is
       handled via the same hardware and therefore shares an encoding. Round mode
@@ -1569,7 +1637,8 @@
     <src widen="true">Value to convert</src>
   </group>
 
-  <group name="CONVERT" title="16->32 integer data conversions" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="CONVERT" title="16->32 integer data conversions" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>
       Performs the given data conversion.
     </desc>
@@ -1586,7 +1655,8 @@
     <src swizzle="true" size="16">Value to convert</src>
   </group>
 
-  <group name="CONVERT" title="Float-to-int data conversions" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="CONVERT" title="Float-to-int data conversions" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>Performs the given data conversion.</desc>
     <ins name="F32_TO_S32" opcode2="0xC"/>
     <ins name="F32_TO_U32" opcode2="0x1C"/>
@@ -1594,7 +1664,8 @@
     <src absneg="true">Value to convert</src>
   </group>
 
-  <group name="CONVERT" title="Float-to-int data conversions" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="CONVERT" title="Float-to-int data conversions" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>Performs the given data conversion.</desc>
     <!-- Removed on v11 -->
     <ins name="V2F16_TO_V2S16" opcode2="0xE"/>
@@ -1608,13 +1679,15 @@
     <src swizzle="true" absneg="true" size="16">Value to convert</src>
   </group>
 
-  <ins name="F16_TO_F32" title="16-bit float to 32-bit float conversion" dests="1" opcode="0x90" opcode2="0xB" unused="true" unit="CVT">
+  <ins name="F16_TO_F32" title="16-bit float to 32-bit float conversion" dests="1" opcode2="0xB" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>Converts up with the specified round mode.</desc>
     <roundmode/>
     <src lane="28" size="16" absneg="true">Value to convert</src>
   </ins>
 
-  <group name="CONVERT" title="8-bit to 32-bit data conversions" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="CONVERT" title="8-bit to 32-bit data conversions" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>
       Performs the given data conversion.
     </desc>
@@ -1632,7 +1705,8 @@
     <src lane="28" size="8">Value to convert</src>
   </group>
 
-  <group name="CONVERT" title="8-bit to 16-bit data conversions" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="CONVERT" title="8-bit to 16-bit data conversions" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>
       Performs the given data conversion.
     </desc>
@@ -1649,7 +1723,8 @@
     <src halfswizzle="true" size="8">Value to convert</src>
   </group>
 
-  <group name="FROUND" title="Floating-point rounding" dests="1" opcode="0x90" unused="true" unit="CVT">
+  <group name="FROUND" title="Floating-point rounding" dests="1" unused="true" unit="CVT">
+    <opcode val="0x90" start="48" mask="0x1FF"/>
     <desc>
       Performs the given rounding, using the convert unit.
     </desc>
@@ -1663,33 +1738,38 @@
     <src swizzle="true" absneg="true">Value to convert</src>
   </group>
 
-  <ins name="MOV.i32" title="Register move" dests="1" opcode="0x91" opcode2="0x0" unused="true" unit="CVT">
+  <ins name="MOV.i32" title="Register move" dests="1" opcode2="0x0" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>Canonical register-to-register move.</desc>
     <src/>
   </ins>
 
-  <ins name="CLZ.u32" title="Count leading zeroes" dests="1" opcode="0x91" opcode2="0x4" unused="true" unit="CVT">
+  <ins name="CLZ.u32" title="Count leading zeroes" dests="1" opcode2="0x4" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       Used as a primitive for various bitwise operations.
     </desc>
     <src/>
   </ins>
 
-  <ins name="CLZ.v2u16" title="Count leading zeroes" dests="1" opcode="0x91" opcode2="0x5" unused="true" unit="CVT">
+  <ins name="CLZ.v2u16" title="Count leading zeroes" dests="1" opcode2="0x5" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       Used as a primitive for various bitwise operations.
     </desc>
     <src swizzle="true"/>
   </ins>
 
-  <ins name="CLZ.v4u8" title="Count leading zeroes" dests="1" opcode="0x91" opcode2="0x6" unused="true" unit="CVT">
+  <ins name="CLZ.v4u8" title="Count leading zeroes" dests="1" opcode2="0x6" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       Used as a primitive for various bitwise operations.
     </desc>
     <src/>
   </ins>
 
-  <ins name="IABS.s32" title="Absolute value" dests="1" opcode="0x91" opcode2="0x8" unused="true" unit="CVT">
+  <ins name="IABS.s32" title="Absolute value" dests="1" opcode2="0x8" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       64-bit abs may be constructed in 4 instructions (5 clocks) by checking the
       sign with `ICMP.s32.lt.m1 hi, 0` and negating based on the result with
@@ -1698,16 +1778,19 @@
     <src widen="true"/>
   </ins>
 
-  <ins name="IABS.v2s16" title="Absolute value" dests="1" opcode="0x91" opcode2="0x9" unused="true" unit="CVT">
+  <ins name="IABS.v2s16" title="Absolute value" dests="1" opcode2="0x9" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <src widen="true"/>
   </ins>
 
   <!-- Removed on v11 -->
-  <ins name="IABS.v4s8" title="Absolute value" dests="1" opcode="0x91" opcode2="0xa" unused="true" unit="CVT">
+  <ins name="IABS.v4s8" title="Absolute value" dests="1" opcode2="0xa" unused="true" unit="CVT">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <src/>
   </ins>
 
-  <ins name="POPCOUNT.i32" title="Population count" dests="1" opcode="0x91" opcode2="0xC" unused="true" unit="SFU">
+  <ins name="POPCOUNT.i32" title="Population count" dests="1" opcode2="0xC" unused="true" unit="SFU">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       Only available as 32-bit. Smaller bitsizes require explicit conversions.
       64-bit popcount may be constructed in 3 clocks by separate 32-bit
@@ -1717,28 +1800,32 @@
     <src/>
   </ins>
 
-  <ins name="BITREV.i32" title="Bitwise reverse" dests="1" opcode="0x91" opcode2="0xD" unused="true" unit="SFU">
+  <ins name="BITREV.i32" title="Bitwise reverse" dests="1" opcode2="0xD" unused="true" unit="SFU">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       Only available as 32-bit. Other bitsizes may be derived with swizzles.
     </desc>
     <src/>
   </ins>
 
-  <ins name="NOT_OLD.i32" title="Bitwise complement" dests="1" opcode="0x91" opcode2="0xE" unused="true" unit="SFU">
+  <ins name="NOT_OLD.i32" title="Bitwise complement" dests="1" opcode2="0xE" unused="true" unit="SFU">
+    <opcode val="0x91" start="48" mask="0x1FF"/>
     <desc>
       For fully featured bitwise operation, see the shift opcodes.
     </desc>
     <src/>
   </ins>
 
-  <ins name="NOT_OLD.i64" title="Bitwise complement" dests="1" opcode="0x191" opcode2="0xE" unused="true" unit="SFU">
+  <ins name="NOT_OLD.i64" title="Bitwise complement" dests="1" opcode2="0xE" unused="true" unit="SFU">
+    <opcode val="0x191" start="48" mask="0x1FF"/>
     <desc>
       For fully featured bitwise operation, see the shift opcodes.
     </desc>
     <src/>
   </ins>
 
-  <ins name="WMASK" title="Warp mask" dests="1" opcode="0x95" unused="true" unit="CVT">
+  <ins name="WMASK" title="Warp mask" dests="1" unused="true" unit="CVT">
+    <opcode val="0x95" start="48" mask="0x1FF"/>
     <desc>
       Returns the mask of lanes ever active within the warp (subgroup), such
       that the source is nonzero. The number of work-items in a subgroup is
@@ -1754,7 +1841,8 @@
     <subgroup/>
   </ins>
 
-  <group name = "FLUSH" title="Flush floats" dests="1" opcode="0x98" unit="CVT">
+  <group name = "FLUSH" title="Flush floats" dests="1" unit="CVT">
+    <opcode val="0x98" start="48" mask="0x1FF"/>
     <ins name="FLUSH.f32" opcode2="0"/>
     <ins name="FLUSH.v2f16" opcode2="1"/>
     <desc>
@@ -1769,7 +1857,8 @@
     <src float="true" absneg="true" swizzle="true"/>
   </group>
 
-  <group name="FREXP" title="Fraction/exponent extract" dests="1" opcode="0x99" unused="true" unit="CVT">
+  <group name="FREXP" title="Fraction/exponent extract" dests="1" unused="true" unit="CVT">
+    <opcode val="0x99" start="48" mask="0x1FF"/>
     <ins name="FREXPM.f32" opcode2="0"/>
     <!-- Removed on v11 -->
     <ins name="FREXPM.v2f16" opcode2="1"/>
@@ -1788,7 +1877,8 @@
     <src float="true" swizzle="true"/>
   </group>
 
-  <group name="SFU" title="Special function unit" dests="1" opcode="0x9C" unused="true" unit="SFU">
+  <group name="SFU" title="Special function unit" dests="1" unused="true" unit="SFU">
+    <opcode val="0x9C" start="48" mask="0x1FF"/>
     <ins name="FRCP.f32" opcode2="0"/>
     <ins name="FRCP.f16" opcode2="1"/>
     <ins name="FRSQ.f32" opcode2="2"/>
@@ -1810,7 +1900,8 @@
     <src float="true" swizzle="true" absneg="true"/>
   </group>
 
-  <group name="SFU" title="Special function unit" dests="1" opcode="0x9C" unused="true" unit="SFU">
+  <group name="SFU" title="Special function unit" dests="1" unused="true" unit="SFU">
+    <opcode val="0x9C" start="48" mask="0x1FF"/>
     <ins name="FSIN_TABLE.u6" opcode2="4"/>
     <ins name="FCOS_TABLE.u6" opcode2="5"/>
     <ins name="FSINCOS_OFFSET.u6" opcode2="6"/>
@@ -1824,8 +1915,12 @@
   </group>
 
   <group name="FADD" title="Floating-point add" dests="1" opcode2="0" unused="true" unit="FMA">
-    <ins name="FADD.f32" opcode="0xA4"/>
-    <ins name="FADD.v2f16" opcode="0xA5"/>
+    <ins name="FADD.f32">
+      <opcode val="0xA4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="FADD.v2f16">
+      <opcode val="0xA5" start="48" mask="0x1FF"/>
+    </ins>
     <desc>$A + B$</desc>
     <roundmode/>
     <clamp/>
@@ -1835,8 +1930,12 @@
   </group>
 
   <group name="FMIN" title="Floating-point minimum" dests="1" opcode2="2" unused="true" unit="CVT">
-    <ins name="FMIN.f32" opcode="0xA4"/>
-    <ins name="FMIN.v2f16" opcode="0xA5"/>
+    <ins name="FMIN.f32">
+      <opcode val="0xA4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="FMIN.v2f16">
+      <opcode val="0xA5" start="48" mask="0x1FF"/>
+    </ins>
     <desc>$\min \{ A, B \}$</desc>
     <clamp/>
     <src absneg="true" swizzle="true">A</src>
@@ -1844,8 +1943,12 @@
   </group>
 
   <group name="FMAX" title="Floating-point maximum" dests="1" opcode2="3" unused="true" unit="CVT">
-    <ins name="FMAX.f32" opcode="0xA4"/>
-    <ins name="FMAX.v2f16" opcode="0xA5"/>
+    <ins name="FMAX.f32">
+      <opcode val="0xA4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="FMAX.v2f16">
+      <opcode val="0xA5" start="48" mask="0x1FF"/>
+    </ins>
     <desc>$\max \{ A, B \}$</desc>
     <clamp/>
     <src absneg="true" swizzle="true">A</src>
@@ -1854,7 +1957,9 @@
 
   <!-- Removed on v11 -->
   <group name="V2F32_TO_V2F16" title="Vectorized floating-point conversion" dests="1" opcode2="4" unused="true" unit="CVT">
-    <ins name="V2F32_TO_V2F16" opcode="0xA5"/>
+    <ins name="V2F32_TO_V2F16">
+      <opcode val="0xA5" start="48" mask="0x1FF"/>
+    </ins>
     <desc>
       Given a pair of 32-bit floats, output a pair of 16-bit floats packed into
       a 32-bit destination.
@@ -1866,8 +1971,12 @@
   </group>
 
   <group name="LDEXP" title="Floating-point rescaling" dests="1" opcode2="6" unused="true" unit="FMA">
-    <ins name="LDEXP.f32" opcode="0xA4"/>
-    <ins name="LDEXP.v2f16" opcode="0xA5"/>
+    <ins name="LDEXP.f32">
+      <opcode val="0xA4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LDEXP.v2f16">
+      <opcode val="0xA5" start="48" mask="0x1FF"/>
+    </ins>
     <desc>
       Computes $A \cdot 2^B$ by adding B to the exponent of A. Used to calculate
       various special functions, particularly base-2 exponents. Special case
@@ -1880,7 +1989,8 @@
     <!-- Also has infinity handling for arctan -->
   </group>
 
-  <ins name="FEXP.f32" title="Floating-point exponent" dests="1" opcode="0xA4" opcode2="8" unused="true" unit="SFU">
+  <ins name="FEXP.f32" title="Floating-point exponent" dests="1" opcode2="8" unused="true" unit="SFU">
+    <opcode val="0xA4" start="48" mask="0x1FF"/>
     <desc>
       Calculates the base-2 exponent of an argument specified as a 8:24
       fixed-point. The original argument is passed as well for correct handling
@@ -1891,7 +2001,8 @@
     <src absneg="true">Input as 32-bit float</src>
   </ins>
 
-  <ins name="FADD_LSCALE.f32" title="Floating-point add with logarithm scale" dests="1" opcode="0xA4" opcode2="9" unused="true" unit="FMA">
+  <ins name="FADD_LSCALE.f32" title="Floating-point add with logarithm scale" dests="1" opcode2="9" unused="true" unit="FMA">
+    <opcode val="0xA4" start="48" mask="0x1FF"/>
     <desc>
       Performs a floating-point addition specialized for logarithm computation.
     </desc>
@@ -1900,7 +2011,8 @@
     <src absneg="true">B</src>
   </ins>
 
-  <ins name="FATAN_ASSIST.f32" title="ATAN calculation helper" dests="1" opcode="0xA4" opcode2="14" unused="true" unit="SFU">
+  <ins name="FATAN_ASSIST.f32" title="ATAN calculation helper" dests="1" opcode2="14" unused="true" unit="SFU">
+    <opcode val="0xA4" start="48" mask="0x1FF"/>
     <desc>
       Used for `atan2()` implementation. Destination is two 16-bit
       values (int and float) for the first form, and a single 32-bit float when
@@ -1918,38 +2030,71 @@
       As Valhall lacks swizzle instructions, `IADD.v2i16` with zero is the
       canonical lowering for swizzles.
     </desc>
-    <ins name="IADD.u32" opcode="0xA0"/>
-    <ins name="IADD.v2u16" opcode="0xA1"/>
+    <ins name="IADD.u32">
+      <opcode val="0xA0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IADD.v2u16">
+      <opcode val="0xA1" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="IADD.v4u8" opcode="0xA2"/>
-    <ins name="IADD.s32" opcode="0xA8"/>
-    <ins name="IADD.v2s16" opcode="0xA9"/>
+    <ins name="IADD.v4u8">
+      <opcode val="0xA2" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IADD.s32">
+      <opcode val="0xA8" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IADD.v2s16">
+      <opcode val="0xA9" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="IADD.v4s8" opcode="0xAA"/>
-    <ins name="IADD.u64" opcode="0x1A3"/>
-    <ins name="IADD.s64" opcode="0x1AB"/>
+    <ins name="IADD.v4s8">
+      <opcode val="0xAA" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IADD.u64">
+      <opcode val="0x1A3" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IADD.s64">
+      <opcode val="0x1AB" start="48" mask="0x1FF"/>
+    </ins>
     <src widen="true">A</src>
     <src widen="true">B</src>
     <saturate/>
   </group>
 
-  <ins name="MKVEC.v2i16" title="Make 16-bit vector" dests="1" opcode="0xA1" opcode2="0x5" unused="true" unit="CVT">
+  <ins name="MKVEC.v2i16" title="Make 16-bit vector" dests="1" opcode2="0x5" unused="true" unit="CVT">
+    <opcode val="0xA1" start="48" mask="0x1FF"/>
     <desc>Calculates $A | (B \ll 16)$. Used to implement `(ushort2)(A, B)`</desc>
     <src lane="28">A</src>
     <src lane="26">B</src>
   </ins>
 
   <group name="ISUB" title="Integer subtract" dests="1" opcode2="1" unused="true" unit="CVT">
-    <ins name="ISUB.u32" opcode="0xA0"/>
-    <ins name="ISUB.v2u16" opcode="0xA1"/>
+    <ins name="ISUB.u32">
+      <opcode val="0xA0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ISUB.v2u16">
+      <opcode val="0xA1" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="ISUB.v4u8" opcode="0xA2"/>
-    <ins name="ISUB.s32" opcode="0xA8"/>
-    <ins name="ISUB.v2s16" opcode="0xA9"/>
+    <ins name="ISUB.v4u8">
+      <opcode val="0xA2" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ISUB.s32">
+      <opcode val="0xA8" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ISUB.v2s16">
+      <opcode val="0xA9" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="ISUB.v4s8" opcode="0xAA"/>
-    <ins name="ISUB.u64" opcode="0x1A3"/>
-    <ins name="ISUB.s64" opcode="0x1AB"/>
+    <ins name="ISUB.v4s8">
+      <opcode val="0xAA" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ISUB.u64">
+      <opcode val="0x1A3" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ISUB.s64">
+      <opcode val="0x1AB" start="48" mask="0x1FF"/>
+    </ins>
     <desc>$A - B$ with optional saturation</desc>
     <src widen="true">A</src>
     <src widen="true">B</src>
@@ -1964,7 +2109,9 @@
 
       .neg indicates SEG_SUB instead.
     </desc>
-    <ins name="SEG_ADD.u64" opcode="0x1A3"/>
+    <ins name="SEG_ADD.u64">
+      <opcode val="0x1A3" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="neg" start="38" size="1"/>
     <va_mod name="preserve_null" start="39" size="1"/>
     <src>A</src>
@@ -1977,21 +2124,39 @@
       64-bit value A. These instructions accelerate address arithmetic, but may
       be used in full generality for 64-bit integer arithmetic.
     </desc>
-    <ins name="SHADDX.u64" opcode="0x1A3"/>
-    <ins name="SHADDX.s64" opcode="0x1AB"/>
+    <ins name="SHADDX.u64">
+      <opcode val="0x1A3" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="SHADDX.s64">
+      <opcode val="0x1AB" start="48" mask="0x1FF"/>
+    </ins>
     <imm name="shift" start="20" size="3"/>
     <src>A</src>
     <src widen="true">B</src>
   </group>
 
   <group name="IMUL" title="Integer multiply" dests="1" opcode2="0x0A" unused="true" unit="SFU">
-    <ins name="IMUL.i32" opcode="0xA0"/>
-    <ins name="IMUL.v2i16" opcode="0xA1"/>
-    <ins name="IMUL.v4i8" opcode="0xA2"/>
-    <ins name="IMUL.s32" opcode="0xA8"/>
-    <ins name="IMUL.v2s16" opcode="0xA9"/>
-    <ins name="IMUL.v4s8" opcode="0xAA"/>
-    <ins name="IMULD.u64" opcode="0x1A3"/>
+    <ins name="IMUL.i32">
+      <opcode val="0xA0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IMUL.v2i16">
+      <opcode val="0xA1" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IMUL.v4i8">
+      <opcode val="0xA2" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IMUL.s32">
+      <opcode val="0xA8" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IMUL.v2s16">
+      <opcode val="0xA9" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IMUL.v4s8">
+      <opcode val="0xAA" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="IMULD.u64">
+      <opcode val="0x1A3" start="48" mask="0x1FF"/>
+    </ins>
     <desc>
       $A \cdot B$ with optional saturation. Note the multipliers can only handle up to
       32-bit by 32-bit multiplies. The 64-bit "multiply" acts like IMUL.u32 but
@@ -2006,12 +2171,24 @@
 
   <!-- Removed on v11 -->
   <group name="HADD" title="Integer half-add" dests="1" opcode2="0x0B" unused="true" unit="CVT">
-    <ins name="HADD.u32" opcode="0xA0"/>
-    <ins name="HADD.v2u16" opcode="0xA1"/>
-    <ins name="HADD.v4u8" opcode="0xA2"/>
-    <ins name="HADD.s32" opcode="0xA8"/>
-    <ins name="HADD.v2s16" opcode="0xA9"/>
-    <ins name="HADD.v4s8" opcode="0xAA"/>
+    <ins name="HADD.u32">
+      <opcode val="0xA0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="HADD.v2u16">
+      <opcode val="0xA1" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="HADD.v4u8">
+      <opcode val="0xA2" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="HADD.s32">
+      <opcode val="0xA8" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="HADD.v2s16">
+      <opcode val="0xA9" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="HADD.v4s8">
+      <opcode val="0xAA" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="rhadd" start="30" size="1"/>
     <src widen="true">A</src>
     <src widen="true">B</src>
@@ -2022,7 +2199,8 @@
     </desc>
   </group>
 
-  <ins name="CLPER.i32" title="Cross-lane permute" dests="1" opcode="0xA0" opcode2="0xF" unused="true" unit="SFU">
+  <ins name="CLPER.i32" title="Cross-lane permute" dests="1" opcode2="0xF" unused="true" unit="SFU">
+    <opcode val="0xA0" start="48" mask="0x1FF"/>
     <desc>
       Selects the value of A in the subgroup lane given by B. This implements
       subgroup broadcasts. It may be used as a primitive for screen space
@@ -2036,8 +2214,12 @@
   </ins>
 
   <group name="FMA" title="Fused floating-point multiply add" dests="1" unused="true" unit="FMA">
-    <ins name="FMA.f32" opcode="0xB2"/>
-    <ins name="FMA.v2f16" opcode="0xB3"/>
+    <ins name="FMA.f32">
+      <opcode val="0xB2" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="FMA.v2f16">
+      <opcode val="0xB3" start="48" mask="0x1FF"/>
+    </ins>
     <desc>$A \cdot B + C$</desc>
     <clamp/>
     <roundmode/>
@@ -2047,10 +2229,18 @@
   </group>
 
   <group name="LSHIFT_AND" title="Left shift and bitwise AND" dests="1" opcode2="0x100" unused="true" unit="SFU">
-    <ins name="LSHIFT_AND.i32" opcode="0xB4"/>
-    <ins name="LSHIFT_AND.v2i16" opcode="0xB5"/>
-    <ins name="LSHIFT_AND.v4i8" opcode="0xB6"/>
-    <ins name="LSHIFT_AND.i64" opcode="0x1B7"/>
+    <ins name="LSHIFT_AND.i32">
+      <opcode val="0xB4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_AND.v2i16">
+      <opcode val="0xB5" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_AND.v4i8">
+      <opcode val="0xB6" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_AND.i64">
+      <opcode val="0x1B7" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="left" start="128" size="1" implied="true"/>
     <desc>
       Left shifts its first source by a specified amount and bitwise ANDs it with the
@@ -2063,10 +2253,18 @@
   </group>
 
   <group name="RSHIFT_AND" title="Right shift and bitwise AND" dests="1" opcode2="0x000" unused="true" unit="SFU">
-    <ins name="RSHIFT_AND.i32" opcode="0xB4"/>
-    <ins name="RSHIFT_AND.v2i16" opcode="0xB5"/>
-    <ins name="RSHIFT_AND.v4i8" opcode="0xB6"/>
-    <ins name="RSHIFT_AND.i64" opcode="0x1B7"/>
+    <ins name="RSHIFT_AND.i32">
+      <opcode val="0xB4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_AND.v2i16">
+      <opcode val="0xB5" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_AND.v4i8">
+      <opcode val="0xB6" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_AND.i64">
+      <opcode val="0x1B7" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="left" start="128" size="1" implied="true"/>
     <desc>
       Right shifts its first source by a specified amount and bitwise ANDs it with the
@@ -2082,10 +2280,18 @@
   </group>
 
   <group name="LSHIFT_OR" title="Left shift and bitwise OR" dests="1" opcode2="0x101" unused="true" unit="SFU">
-    <ins name="LSHIFT_OR.i32" opcode="0xB4"/>
-    <ins name="LSHIFT_OR.v2i16" opcode="0xB5"/>
-    <ins name="LSHIFT_OR.v4i8" opcode="0xB6"/>
-    <ins name="LSHIFT_OR.i64" opcode="0x1B7"/>
+    <ins name="LSHIFT_OR.i32">
+      <opcode val="0xB4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_OR.v2i16">
+      <opcode val="0xB5" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_OR.v4i8">
+      <opcode val="0xB6" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_OR.i64">
+      <opcode val="0x1B7" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="left" start="128" size="1" implied="true"/>
     <desc>
       Left shifts its first source by a specified amount and bitwise ORs it with the
@@ -2098,10 +2304,18 @@
   </group>
 
   <group name="RSHIFT_OR" title="Right shift and bitwise OR" dests="1" opcode2="0x001" unused="true" unit="SFU">
-    <ins name="RSHIFT_OR.i32" opcode="0xB4"/>
-    <ins name="RSHIFT_OR.v2i16" opcode="0xB5"/>
-    <ins name="RSHIFT_OR.v4i8" opcode="0xB6"/>
-    <ins name="RSHIFT_OR.i64" opcode="0x1B7"/>
+    <ins name="RSHIFT_OR.i32">
+      <opcode val="0xB4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_OR.v2i16">
+      <opcode val="0xB5" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_OR.v4i8">
+      <opcode val="0xB6" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_OR.i64">
+      <opcode val="0x1B7" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="left" start="128" size="1" implied="true"/>
     <desc>
       Right shifts its first source by a specified amount and bitwise ORs it with the
@@ -2117,10 +2331,18 @@
   </group>
 
   <group name="LSHIFT_XOR" title="Left shift and bitwise XOR" dests="1" opcode2="0x102" unused="true" unit="SFU">
-    <ins name="LSHIFT_XOR.i32" opcode="0xB4"/>
-    <ins name="LSHIFT_XOR.v2i16" opcode="0xB5"/>
-    <ins name="LSHIFT_XOR.v4i8" opcode="0xB6"/>
-    <ins name="LSHIFT_XOR.i64" opcode="0x1B7"/>
+    <ins name="LSHIFT_XOR.i32">
+      <opcode val="0xB4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_XOR.v2i16">
+      <opcode val="0xB5" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_XOR.v4i8">
+      <opcode val="0xB6" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="LSHIFT_XOR.i64">
+      <opcode val="0x1B7" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="left" start="128" size="1" implied="true"/>
     <desc>
       Left shifts its first source by a specified amount and bitwise XORs it with the
@@ -2133,10 +2355,18 @@
   </group>
 
   <group name="RSHIFT_XOR" title="Right shift and bitwise XOR" dests="1" opcode2="0x002" unused="true" unit="SFU">
-    <ins name="RSHIFT_XOR.i32" opcode="0xB4"/>
-    <ins name="RSHIFT_XOR.v2i16" opcode="0xB5"/>
-    <ins name="RSHIFT_XOR.v4i8" opcode="0xB6"/>
-    <ins name="RSHIFT_XOR.i64" opcode="0x1B7"/>
+    <ins name="RSHIFT_XOR.i32">
+      <opcode val="0xB4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_XOR.v2i16">
+      <opcode val="0xB5" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_XOR.v4i8">
+      <opcode val="0xB6" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="RSHIFT_XOR.i64">
+      <opcode val="0x1B7" start="48" mask="0x1FF"/>
+    </ins>
     <va_mod name="left" start="128" size="1" implied="true"/>
     <desc>
       Right shifts its first source by a specified amount and bitwise XORs it with the
@@ -2151,7 +2381,8 @@
     <src not="true">B</src>
   </group>
 
-  <ins name="MUX.i32" title="Mux" dests="1" opcode="0xB8" unused="true" unit="SFU">
+  <ins name="MUX.i32" title="Mux" dests="1" unused="true" unit="SFU">
+    <opcode val="0xB8" start="48" mask="0x1FF"/>
     <desc>
       Mux between A and B based on the provided mask. The condition specified
       as the `mux` modifier is evaluated on the mask. If true, `A` is chosen,
@@ -2165,7 +2396,8 @@
     <src>Mask</src>
   </ins>
 
-  <ins name="MUX.v2i16" title="Mux" dests="1" opcode="0xB9" unused="true" unit="SFU">
+  <ins name="MUX.v2i16" title="Mux" dests="1" unused="true" unit="SFU">
+    <opcode val="0xB9" start="48" mask="0x1FF"/>
     <desc>
       Mux between A and B based on the provided mask. The condition specified
       as the `mux` modifier is evaluated on the mask. If true, `A` is chosen,
@@ -2179,7 +2411,8 @@
     <src swizzle="true">Mask</src>
   </ins>
 
-  <ins name="MUX.v4i8" title="Mux" dests="1" opcode="0xBA" unused="true" unit="SFU">
+  <ins name="MUX.v4i8" title="Mux" dests="1" unused="true" unit="SFU">
+    <opcode val="0xBA" start="48" mask="0x1FF"/>
     <desc>
       Mux between A and B based on the provided mask. The condition specified
       as the `mux` modifier is evaluated on the mask. If true, `A` is chosen,
@@ -2193,21 +2426,24 @@
     <src>Mask</src>
   </ins>
 
-  <ins name="CUBE_SSEL" title="Cube S-coordinate select" dests="1" opcode="0xBC" opcode2="0" unused="true" unit="SFU">
+  <ins name="CUBE_SSEL" title="Cube S-coordinate select" dests="1" opcode2="0" unused="true" unit="SFU">
+    <opcode val="0xBC" start="48" mask="0x1FF"/>
     <desc>During a cube map transform, select the S coordinate given a selected face.</desc>
     <src absneg="true">Z coordinate as 32-bit floating point</src>
     <src absneg="true">X coordinate as 32-bit floating point</src>
     <src>Cube face index</src>
   </ins>
 
-  <ins name="CUBE_TSEL" title="Cube T-coordinate select" dests="1" opcode="0xBC" opcode2="1" unused="true" unit="SFU">
+  <ins name="CUBE_TSEL" title="Cube T-coordinate select" dests="1" opcode2="1" unused="true" unit="SFU">
+    <opcode val="0xBC" start="48" mask="0x1FF"/>
     <desc>During a cube map transform, select the T coordinate given a selected face.</desc>
     <src absneg="true">Y coordinate as 32-bit floating point</src>
     <src absneg="true">Z coordinate as 32-bit floating point</src>
     <src>Cube face index</src>
   </ins>
 
-  <ins name="MKVEC.v2i8" title="Make 8-bit vector" dests="1" opcode="0xBD" unit="CVT">
+  <ins name="MKVEC.v2i8" title="Make 8-bit vector" dests="1" unit="CVT">
+    <opcode val="0xBD" start="48" mask="0x1FF"/>
     <desc>
       Calculates $A | (B \ll 8) | (CD \ll 16)$ for 8-bit A and B and 16-bit CD.
 
@@ -2222,21 +2458,24 @@
     <src>CD</src>
   </ins>
 
-  <ins name="CUBEFACE1" title="Cube map transform step 1" dests="1" opcode="0xC0" unused="true" unit="SFU">
+  <ins name="CUBEFACE1" title="Cube map transform step 1" dests="1" unused="true" unit="SFU">
+    <opcode val="0xC0" start="48" mask="0x1FF"/>
     <desc>Select the maximum absolute value of its arguments.</desc>
     <src absneg="true">X coordinate as 32-bit floating point</src>
     <src absneg="true">Y coordinate as 32-bit floating point</src>
     <src absneg="true">Z coordinate as 32-bit floating point</src>
   </ins>
 
-  <ins name="CUBEFACE2_V9" title="Cube map transform step 2" dests="1" opcode="0xC1" unit="SFU">
+  <ins name="CUBEFACE2_V9" title="Cube map transform step 2" dests="1" unit="SFU">
+    <opcode val="0xC1" start="48" mask="0x1FF"/>
     <desc>Select the cube face index corresponding to the arguments.</desc>
     <src absneg="true">X coordinate as 32-bit floating point</src>
     <src absneg="true">Y coordinate as 32-bit floating point</src>
     <src absneg="true">Z coordinate as 32-bit floating point</src>
   </ins>
 
-  <group name="IDPADD" title="8-bit dot product and accumulate" dests="1" opcode="0xC2" unit="FMA">
+  <group name="IDPADD" title="8-bit dot product and accumulate" dests="1" unit="FMA">
+    <opcode val="0xC2" start="48" mask="0x1FF"/>
     <desc>
       8-bit integer dot product between 4 channel vectors, intended for machine
       learning. Available in both unsigned and signed variants, controlling
@@ -2264,10 +2503,16 @@
       for chaining together conditions without intermediate bitwise arithmetic;
       when this is not desired, tie it to zero.
     </desc>
-    <ins name="ICMP_OR.u32" opcode="0xF0"/>
-    <ins name="ICMP_OR.v2u16" opcode="0xF1"/>
+    <ins name="ICMP_OR.u32">
+      <opcode val="0xF0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ICMP_OR.v2u16">
+      <opcode val="0xF1" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="ICMP_OR.v4u8" opcode="0xF2"/>
+    <ins name="ICMP_OR.v4u8">
+      <opcode val="0xF2" start="48" mask="0x1FF"/>
+    </ins>
     <cmp int_only="true"/>
     <result_type/>
     <src widen="true">A</src>
@@ -2282,10 +2527,16 @@
       one, integer minus one, or floating-point one). The third source is useful
       for chaining together conditions without intermediate bitwise arithmetic.
     </desc>
-    <ins name="ICMP_AND.u32" opcode="0xF0"/>
-    <ins name="ICMP_AND.v2u16" opcode="0xF1"/>
+    <ins name="ICMP_AND.u32">
+      <opcode val="0xF0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ICMP_AND.v2u16">
+      <opcode val="0xF1" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="ICMP_AND.v4u8" opcode="0xF2"/>
+    <ins name="ICMP_AND.v4u8">
+      <opcode val="0xF2" start="48" mask="0x1FF"/>
+    </ins>
     <cmp int_only="true"/>
     <result_type/>
     <src widen="true">A</src>
@@ -2301,8 +2552,12 @@
       for chaining together conditions without intermediate bitwise arithmetic;
       when this is not desired, tie it to zero.
     </desc>
-    <ins name="FCMP_OR.f32" opcode="0xF4"/>
-    <ins name="FCMP_OR.v2f16" opcode="0xF5"/>
+    <ins name="FCMP_OR.f32">
+      <opcode val="0xF4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="FCMP_OR.v2f16">
+      <opcode val="0xF5" start="48" mask="0x1FF"/>
+    </ins>
     <cmp/>
     <result_type/>
     <src absneg="true" swizzle="true">A</src>
@@ -2317,8 +2572,12 @@
       one, integer minus one, or floating-point one). The third source is useful
       for chaining together conditions without intermediate bitwise arithmetic.
     </desc>
-    <ins name="FCMP_AND.f32" opcode="0xF4"/>
-    <ins name="FCMP_AND.v2f16" opcode="0xF5"/>
+    <ins name="FCMP_AND.f32">
+      <opcode val="0xF4" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="FCMP_AND.v2f16">
+      <opcode val="0xF5" start="48" mask="0x1FF"/>
+    </ins>
     <cmp/>
     <result_type/>
     <src absneg="true" swizzle="true">A</src>
@@ -2333,10 +2592,16 @@
       one, integer minus one, or floating-point one). The third source is useful
       for chaining together conditions without intermediate bitwise arithmetic.
     </desc>
-    <ins name="ICMP_OR.s32" opcode="0xF8"/>
-    <ins name="ICMP_OR.v2s16" opcode="0xF9"/>
+    <ins name="ICMP_OR.s32">
+      <opcode val="0xF8" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ICMP_OR.v2s16">
+      <opcode val="0xF9" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="ICMP_OR.v4s8" opcode="0xFA"/>
+    <ins name="ICMP_OR.v4s8">
+      <opcode val="0xFA" start="48" mask="0x1FF"/>
+    </ins>
     <cmp int_only="true"/>
     <result_type/>
     <src widen="true">A</src>
@@ -2351,10 +2616,16 @@
       one, integer minus one, or floating-point one). The third source is useful
       for chaining together conditions without intermediate bitwise arithmetic.
     </desc>
-    <ins name="ICMP_AND.s32" opcode="0xF8"/>
-    <ins name="ICMP_AND.v2s16" opcode="0xF9"/>
+    <ins name="ICMP_AND.s32">
+      <opcode val="0xF8" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ICMP_AND.v2s16">
+      <opcode val="0xF9" start="48" mask="0x1FF"/>
+    </ins>
     <!-- Removed on v11 -->
-    <ins name="ICMP_AND.v4s8" opcode="0xFA"/>
+    <ins name="ICMP_AND.v4s8">
+      <opcode val="0xFA" start="48" mask="0x1FF"/>
+    </ins>
     <cmp int_only="true"/>
     <result_type/>
     <src widen="true">A</src>
@@ -2376,8 +2647,12 @@
       result type on the low half, the `m1` result type on the high half, and
       the result of the low half comparison passed as the third source.
     </desc>
-    <ins name="ICMP_MULTI.u32" opcode="0xF0"/>
-    <ins name="ICMP_MULTI.s32" opcode="0xF8"/>
+    <ins name="ICMP_MULTI.u32">
+      <opcode val="0xF0" start="48" mask="0x1FF"/>
+    </ins>
+    <ins name="ICMP_MULTI.s32">
+      <opcode val="0xF8" start="48" mask="0x1FF"/>
+    </ins>
     <cmp int_only="true"/>
     <result_type/>
     <src widen="true">A</src>
@@ -2385,7 +2660,8 @@
     <src>C</src>
   </group>
 
-  <ins name="IADD_IMM.i32" title="Integer addition with immediate" dests="1" opcode="0x110" unit="CVT">
+  <ins name="IADD_IMM.i32" title="Integer addition with immediate" dests="1" unit="CVT">
+    <opcode val="0x110" start="48" mask="0x1FF"/>
     <desc>
       Adds an arbitrary 32-bit immediate embedded within the instruction stream.
       If no modifiers are required, this is preferred to `IADD.i32` with a
@@ -2398,7 +2674,8 @@
     <imm name="constant" ir_name="index" start="8" size="32"/>
   </ins>
 
-  <ins name="IADD_IMM.v2i16" title="Integer addition with immediate" dests="1" opcode="0x111" unit="CVT">
+  <ins name="IADD_IMM.v2i16" title="Integer addition with immediate" dests="1" unit="CVT">
+    <opcode val="0x111" start="48" mask="0x1FF"/>
     <desc>
       Adds an arbitrary pair of 16-bit immediates embedded within the
       instruction stream. If no modifiers are required, this is preferred to
@@ -2411,7 +2688,8 @@
   </ins>
 
   <!-- Removed on v11 -->
-  <ins name="IADD_IMM.v4i8" title="Integer addition with immediate" dests="1" opcode="0x112" unit="CVT">
+  <ins name="IADD_IMM.v4i8" title="Integer addition with immediate" dests="1" unit="CVT">
+    <opcode val="0x112" start="48" mask="0x1FF"/>
     <desc>
       Adds an arbitrary quad of 8-bit immediates embedded within the
       instruction stream. If no modifiers are required, this is preferred to
@@ -2423,7 +2701,8 @@
     <imm name="constant" ir_name="index" start="8" size="32"/>
   </ins>
 
-  <ins name="FADD_IMM.f32" title="Floating-point addition with immediate" dests="1" opcode="0x114" unit="FMA">
+  <ins name="FADD_IMM.f32" title="Floating-point addition with immediate" dests="1" unit="FMA">
+    <opcode val="0x114" start="48" mask="0x1FF"/>
     <desc>
       Adds an arbitrary 32-bit immediate embedded within the instruction stream.
       If no modifiers are required, this is preferred to `FADD.f32` with a
@@ -2434,7 +2713,8 @@
     <imm name="constant" ir_name="index" start="8" size="32"/>
   </ins>
 
-  <ins name="FADD_IMM.v2f16" title="Floating-point addition with immediate" dests="1" opcode="0x115" unit="FMA">
+  <ins name="FADD_IMM.v2f16" title="Floating-point addition with immediate" dests="1" unit="FMA">
+    <opcode val="0x115" start="48" mask="0x1FF"/>
     <desc>
       Adds an arbitrary pair of 16-bit immediates embedded within the
       instruction stream. If no modifiers are required, this is preferred to
@@ -2446,7 +2726,8 @@
     <imm name="constant" ir_name="index" start="8" size="32"/>
   </ins>
 
-  <ins name="ATOM1_RETURN.i32" title="Atomic operations on memory with 1" opcode="0x69" opcode2="3" unused="true" unit="LS">
+  <ins name="ATOM1_RETURN.i32" title="Atomic operations on memory with 1" opcode2="3" unused="true" unit="LS">
+    <opcode val="0x69" start="48" mask="0x1FF"/>
     <slot/>
     <sr_count/>
     <atom_opc_1/>
@@ -2458,7 +2739,8 @@
     <imm name="offset" start="8" size="8"/>
   </ins>
 
-  <ins name="ATOM1_RETURN.i64" title="Atomic operations on memory with 1" opcode="0x69" opcode2="5" unused="true" unit="LS">
+  <ins name="ATOM1_RETURN.i64" title="Atomic operations on memory with 1" opcode2="5" unused="true" unit="LS">
+    <opcode val="0x69" start="48" mask="0x1FF"/>
     <slot/>
     <sr_count/>
     <atom_opc_1/>
@@ -2470,7 +2752,8 @@
     <imm name="offset" start="8" size="8"/>
   </ins>
 
-  <ins name="ATOM.i32" title="Atomic operations on memory" opcode="0x68" opcode2="3" unused="true" unit="LS">
+  <ins name="ATOM.i32" title="Atomic operations on memory" opcode2="3" unused="true" unit="LS">
+    <opcode val="0x68" start="48" mask="0x1FF"/>
     <slot/>
     <sr_count/>
     <atom_opc/>
@@ -2481,7 +2764,8 @@
     <imm name="offset" start="8" size="8"/>
   </ins>
 
-  <ins name="ATOM.i64" title="Atomic operations on memory" opcode="0x68" opcode2="5" unused="true" unit="LS">
+  <ins name="ATOM.i64" title="Atomic operations on memory" opcode2="5" unused="true" unit="LS">
+    <opcode val="0x68" start="48" mask="0x1FF"/>
     <slot/>
     <sr_count/>
     <atom_opc/>
@@ -2492,7 +2776,8 @@
     <imm name="offset" start="8" size="8"/>
   </ins>
 
-  <ins name="ATOM_RETURN.i32" title="Atomic operations on memory" opcode="0x120" opcode2="3" unused="true" unit="LS">
+  <ins name="ATOM_RETURN.i32" title="Atomic operations on memory" opcode2="3" unused="true" unit="LS">
+    <opcode val="0x120" start="48" mask="0x1FF"/>
     <slot/>
     <sr_count/>
     <sr_write_count/>
@@ -2509,7 +2794,8 @@
     <imm name="offset" start="8" size="8"/>
   </ins>
 
-  <ins name="ATOM_RETURN.i64" title="Atomic operations on memory" opcode="0x120" opcode2="5" unused="true" unit="LS">
+  <ins name="ATOM_RETURN.i64" title="Atomic operations on memory" opcode2="5" unused="true" unit="LS">
+    <opcode val="0x120" start="48" mask="0x1FF"/>
     <slot/>
     <sr_count/>
     <sr_write_count/>
@@ -2526,7 +2812,8 @@
     <imm name="offset" start="8" size="8"/>
   </ins>
 
-  <ins name="TEX_FETCH" title="Texel fetch" opcode="0x125" message="tex" unit="T">
+  <ins name="TEX_FETCH" title="Texel fetch" message="tex" unit="T">
+    <opcode val="0x125" start="48" mask="0x1FF"/>
     <desc>Unfiltered textured instruction.</desc>
     <slot/>
     <skip/>
@@ -2550,7 +2837,8 @@
     <immediate name="sr_count" size="4" pseudo="true"/>
   </ins>
 
-  <ins name="TEX_SINGLE" title="Texture load" opcode="0x128" message="tex" unit="T">
+  <ins name="TEX_SINGLE" title="Texture load" message="tex" unit="T">
+    <opcode val="0x128" start="48" mask="0x1FF"/>
     <desc>Ordinary texturing instruction using a sampler.</desc>
     <slot/>
     <skip/>
@@ -2576,7 +2864,8 @@
     <immediate name="sr_count" size="4" pseudo="true"/>
   </ins>
 
-  <ins name="TEX_GATHER" title="Texel gather" opcode="0x129" message="tex" unit="T">
+  <ins name="TEX_GATHER" title="Texel gather" message="tex" unit="T">
+    <opcode val="0x129" start="48" mask="0x1FF"/>
     <desc>Texture gather instruction.</desc>
     <slot/>
     <skip/>
@@ -2603,7 +2892,8 @@
     <immediate name="sr_count" size="4" pseudo="true"/>
   </ins>
 
-  <ins name="TEX_GRADIENT" title="Texture gradient" opcode="0x12A" message="tex" unit="T">
+  <ins name="TEX_GRADIENT" title="Texture gradient" message="tex" unit="T">
+    <opcode val="0x12A" start="48" mask="0x1FF"/>
     <desc>Texture sample with explicit gradient.</desc>
     <slot/>
     <skip/>
@@ -2627,7 +2917,8 @@
     <immediate name="sr_count" size="4" pseudo="true"/>
   </ins>
 
-  <ins name="TEX_DUAL" title="Dual texture" opcode="0x12F" unused="true" unit="T">
+  <ins name="TEX_DUAL" title="Dual texture" unused="true" unit="T">
+    <opcode val="0x12F" start="48" mask="0x1FF"/>
     <desc>Pair of texture instructions.</desc>
     <slot/>
     <skip/>
@@ -2650,7 +2941,8 @@
     <src size="64">Image to read from</src>
   </ins>
 
-  <ins name="VAR_TEX_BUF_SINGLE" title="Fused varying-texturing" opcode="0x130" unused="true" unit="VT">
+  <ins name="VAR_TEX_BUF_SINGLE" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x130" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_BUF_IMM_F32.v2.f32 followed by TEX, using both V and T units.
@@ -2672,7 +2964,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_BUF_GATHER" title="Fused varying-texturing" opcode="0x131" unused="true" unit="VT">
+  <ins name="VAR_TEX_BUF_GATHER" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x131" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_BUF_IMM_F32.v2.f32 followed by TEX, using both V and T units.
@@ -2695,7 +2988,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_BUF_GRADIENT" title="Fused varying-texturing" opcode="0x132" unused="true" unit="VT">
+  <ins name="VAR_TEX_BUF_GRADIENT" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x132" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_BUF_IMM_F32.v2.f32 followed by TEX, using both V and T units.
@@ -2718,7 +3012,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_BUF_DUAL" title="Fused varying-texturing" opcode="0x137" unused="true" unit="VT">
+  <ins name="VAR_TEX_BUF_DUAL" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x137" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_BUF_IMM_F32.v2.f32 followed by TEX_DUAL, using both V and T units.
@@ -2740,7 +3035,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_SINGLE" title="Fused varying-texturing" opcode="0x138" unused="true" unit="VT">
+  <ins name="VAR_TEX_SINGLE" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x138" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_IMM_F32.v2.f32 followed by TEX, using both V and T units.
@@ -2762,7 +3058,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_GATHER" title="Fused varying-texturing" opcode="0x139" unused="true" unit="VT">
+  <ins name="VAR_TEX_GATHER" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x139" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_IMM_F32.v2.f32 followed by TEX, using both V and T units.
@@ -2785,7 +3082,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_GRADIENT" title="Fused varying-texturing" opcode="0x13A" unused="true" unit="VT">
+  <ins name="VAR_TEX_GRADIENT" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x13A" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_IMM_F32.v2.f32 followed by TEX, using both V and T units.
@@ -2808,7 +3106,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="VAR_TEX_DUAL" title="Fused varying-texturing" opcode="0x13F" unused="true" unit="VT">
+  <ins name="VAR_TEX_DUAL" title="Fused varying-texturing" unused="true" unit="VT">
+    <opcode val="0x13F" start="48" mask="0x1FF"/>
     <desc>
       Only works for FP32 varyings. Performance characteristics are similar
       to LD_VAR_IMM_F32.v2.f32 followed by TEX_DUAL, using both V and T units.
@@ -2830,7 +3129,8 @@
     <src>Varying offset</src>
   </ins>
 
-  <ins name="FMA_RSCALE.f32" title="Fused floating-point multiply add with exponent bias" dests="1" opcode="0x160" unused="true" unit="FMA">
+  <ins name="FMA_RSCALE.f32" title="Fused floating-point multiply add with exponent bias" dests="1" unused="true" unit="FMA">
+    <opcode val="0x160" start="48" mask="0x1FF"/>
     <desc>
       First calculates $A \cdot B + C$ and then biases the exponent by D. Used in
       special transcendental function sequences. It should not be used for
@@ -2845,7 +3145,8 @@
     <src>D</src>
   </ins>
 
-  <ins name="FMA_RSCALE_N.f32" title="Fused floating-point multiply add with exponent bias and zero override" dests="1" opcode="0x161" unused="true" unit="FMA">
+  <ins name="FMA_RSCALE_N.f32" title="Fused floating-point multiply add with exponent bias and zero override" dests="1" unused="true" unit="FMA">
+    <opcode val="0x161" start="48" mask="0x1FF"/>
     <desc>
       First calculates $A \cdot B + C$ and then biases the exponent by D. If $A
       = 0$ or $B = 0$, the multiply $A \cdot B$ is treated as zero even if an
@@ -2861,7 +3162,8 @@
     <src>D</src>
   </ins>
 
-  <ins name="FMA_RSCALE_LEFT.f32" title="Fused floating-point multiply add with exponent bias and asymmetric zero handling" dests="1" opcode="0x162" unused="true" unit="FMA">
+  <ins name="FMA_RSCALE_LEFT.f32" title="Fused floating-point multiply add with exponent bias and asymmetric zero handling" dests="1" unused="true" unit="FMA">
+    <opcode val="0x162" start="48" mask="0x1FF"/>
     <desc>
       First calculates $A \cdot B + C$ and then biases the exponent by D. If $A
       = 0$ or $B = 0$, the multiply is treated as $A$ even if an
@@ -2877,7 +3179,8 @@
     <src>D</src>
   </ins>
 
-  <ins name="FMA_RSCALE_SCALE16.f32" title="Fused floating-point multiply add with 16-bit exponent bias" dests="1" opcode="0x163" unused="true" unit="FMA">
+  <ins name="FMA_RSCALE_SCALE16.f32" title="Fused floating-point multiply add with 16-bit exponent bias" dests="1" unused="true" unit="FMA">
+    <opcode val="0x163" start="48" mask="0x1FF"/>
     <desc>
       First calculates $A \cdot B + C$ and then biases the exponent by D,
       interpreted as a 16-bit value. Used in special transcendental function
diff --git a/src/panfrost/compiler/bifrost/valhall/asm.py b/src/panfrost/compiler/bifrost/valhall/asm.py
index 8301789bb06..560a2b1834d 100644
--- a/src/panfrost/compiler/bifrost/valhall/asm.py
+++ b/src/panfrost/compiler/bifrost/valhall/asm.py
@@ -315,7 +315,7 @@ def parse_asm(line):
     operands = operands[len(ins.immediates):]
 
     # Encode the operation itself
-    encoded |= (ins.opcode << 48)
+    encoded |= (ins.opcode.value << ins.opcode.start)
     encoded |= (ins.opcode2 << ins.secondary_shift)
 
     # Encode FAU page
diff --git a/src/panfrost/compiler/bifrost/valhall/disasm.py b/src/panfrost/compiler/bifrost/valhall/disasm.py
index 58ac0de8c4e..fca5f87f877 100644
--- a/src/panfrost/compiler/bifrost/valhall/disasm.py
+++ b/src/panfrost/compiler/bifrost/valhall/disasm.py
@@ -271,7 +271,7 @@ disassemble_valhall(FILE *fp, const void *code, size_t size, bool verbose)
 # Bucket by opcode for hierarchical disassembly
 OPCODE_BUCKETS = {}
 for ins in instructions:
-    opc = ins.opcode
+    opc = ins.opcode.value  # bucket key is the numeric opcode value only; start/mask are not part of the key
     OPCODE_BUCKETS[opc] = OPCODE_BUCKETS.get(opc, []) + [ins]
 
 # Check that each bucket may be disambiguated
diff --git a/src/panfrost/compiler/bifrost/valhall/valhall.c.py b/src/panfrost/compiler/bifrost/valhall/valhall.c.py
index ea1a559b072..47f7d4a328a 100644
--- a/src/panfrost/compiler/bifrost/valhall/valhall.c.py
+++ b/src/panfrost/compiler/bifrost/valhall/valhall.c.py
@@ -147,7 +147,7 @@ valhall_opcodes[BI_NUM_OPCODES] = {
 
 # Exact value to be ORed in to every opcode
 def exact_op(op):
-    return (op.opcode << 48) | (op.opcode2 << op.secondary_shift)
+    return (op.opcode.value << op.opcode.start) | (op.opcode2 << op.secondary_shift)  # primary opcode is shifted by its own start bit instead of a fixed 48
 
 try:
     print(Template(template).render(immediates = immediates, instructions = instructions, skip = SKIP, exact = exact_op, typesize = typesize))
diff --git a/src/panfrost/compiler/bifrost/valhall/valhall.py b/src/panfrost/compiler/bifrost/valhall/valhall.py
index a3bd52e5191..0ac517a47e4 100644
--- a/src/panfrost/compiler/bifrost/valhall/valhall.py
+++ b/src/panfrost/compiler/bifrost/valhall/valhall.py
@@ -157,6 +157,12 @@ class Immediate:
         self.size = size
         self.signed = signed
 
+class Opcode:  # Primary opcode field of an instruction: a value plus where it sits in the encoding
+    def __init__(self, value, start, mask):
+        self.value = value  # numeric opcode (XML `val` attribute)
+        self.start = start  # bit position the value is shifted to when encoding (XML `start` attribute)
+        self.mask = mask  # XML `mask` attribute; presumably the unshifted field mask -- TODO confirm, nothing reads it yet
+
 class Instruction:
     def __init__(self, name, opcode, opcode2, srcs = [], dests = [], immediates = [], modifiers = [], staging = None, unit = None):
         self.name = name
@@ -179,7 +185,7 @@ class Instruction:
             self.secondary_mask |= 0x100
         if len(srcs) == 3 and (srcs[1].widen or srcs[1].lanes or srcs[1].swizzle):
             self.secondary_mask &= ~0xC # conflicts
-        if opcode == 0x90:
+        if opcode.value == 0x90:
             # XXX: XMLify this, but disambiguates sign of conversions
             self.secondary_mask |= 0x10
         if name.startswith("LOAD.i") or name.startswith("STORE.i") or name.startswith("LD_PKA.i"):
@@ -238,14 +244,22 @@ def build_modifier(el):
 
     return Modifier(name, start, size, implied)
 
+def build_opcode(el, name):  # Parse the first child of `el` with tag `name` into an Opcode
+    opcode = el.find(name)
+    if opcode is None:
+        return None  # no such child element; callers combine this with `or` to fall back to another source
+    value = int(opcode.get('val'), base=0)  # base=0 accepts prefixed literals such as "0x69"
+    start = int(opcode.get('start'))  # plain decimal, e.g. "48"
+    mask = int(opcode.get('mask'), base=0)  # base=0 accepts prefixed literals such as "0x1FF"
+    return Opcode(value, start, mask)
+
 # Build a single instruction from XML and group based overrides
 def build_instr(el, overrides = {}):
     # Get overridables
     name = overrides.get('name') or el.attrib.get('name')
-    opcode = overrides.get('opcode') or el.attrib.get('opcode')
+    opcode = overrides.get('opcode') or build_opcode(el, 'opcode')
     opcode2 = overrides.get('opcode2') or el.attrib.get('opcode2')
     unit = overrides.get('unit') or el.attrib.get('unit')
-    opcode = int(opcode, base=0)
     opcode2 = int(opcode2, base=0) if opcode2 else None
 
     # Get explicit sources/dests
@@ -295,7 +309,7 @@ def build_group(el):
     for ins in el.findall('ins'):
         build_instr(el, overrides = {
             'name': ins.attrib['name'],
-            'opcode': ins.attrib.get('opcode'),
+            'opcode': build_opcode(ins, 'opcode'),
             'opcode2': ins.attrib.get('opcode2'),
             'unit': ins.attrib.get('unit'),
         })
@@ -335,16 +349,16 @@ def safe_name(name):
     return name.lower()
 
 # Parses out the size part of an opcode name
-def typesize(opcode):
-    if opcode[-3:] == '128':
+def typesize(name):  # `name` is a string whose trailing digits encode the size; presumably an instruction name -- confirm
+    if name[-3:] == '128':
         return 128
-    if opcode[-2:] == '48':
+    if name[-2:] == '48':
         return 48
-    elif opcode[-1] == '8':
+    elif name[-1] == '8':  # any remaining name ending in "8" is reported as size 8
         return 8
     else:
         try:
-            return int(opcode[-2:])
+            return int(name[-2:])  # last two characters as a number, e.g. "...32" -> 32; otherwise falls through to 32
         except:
             return 32